diff --git a/.asf.yaml b/.asf.yaml
index 3935a525ff3c4..296aaff5c4a2d 100644
--- a/.asf.yaml
+++ b/.asf.yaml
@@ -13,7 +13,7 @@
# See the License for the specific language governing permissions and
# limitations under the License.
-# https://cwiki.apache.org/confluence/display/INFRA/git+-+.asf.yaml+features
+# https://github.com/apache/infrastructure-asfyaml/blob/main/README.md
---
github:
description: "Apache Spark - A unified analytics engine for large-scale data processing"
diff --git a/.github/workflows/benchmark.yml b/.github/workflows/benchmark.yml
index 6b2e72b3f23be..3e90bb329be56 100644
--- a/.github/workflows/benchmark.yml
+++ b/.github/workflows/benchmark.yml
@@ -50,6 +50,11 @@ on:
description: 'Number of job splits'
required: true
default: '1'
+ create-commit:
+ type: boolean
+ description: 'Commit the benchmark results to the current branch'
+ required: true
+ default: false
jobs:
matrix-gen:
@@ -195,10 +200,31 @@ jobs:
# To keep the directory structure and file permissions, tar them
# See also https://github.com/actions/upload-artifact#maintaining-file-permissions-and-case-sensitive-files
echo "Preparing the benchmark results:"
- tar -cvf benchmark-results-${{ inputs.jdk }}-${{ inputs.scala }}.tar `git diff --name-only` `git ls-files --others --exclude=tpcds-sf-1 --exclude=tpcds-sf-1-text --exclude-standard`
+ tar -cvf target/benchmark-results-${{ inputs.jdk }}-${{ inputs.scala }}.tar `git diff --name-only` `git ls-files --others --exclude=tpcds-sf-1 --exclude=tpcds-sf-1-text --exclude-standard`
+ - name: Create a pull request with the results
+ if: ${{ inputs.create-commit && success() }}
+ run: |
+ git config --local user.name "${{ github.actor }}"
+ git config --local user.email "${{ github.event.pusher.email || format('{0}@users.noreply.github.com', github.actor) }}"
+ git add -A
+ git commit -m "Benchmark results for ${{ inputs.class }} (JDK ${{ inputs.jdk }}, Scala ${{ inputs.scala }}, split ${{ matrix.split }} of ${{ inputs.num-splits }})"
+ for i in {1..5}; do
+ echo "Attempt $i to push..."
+ git fetch origin ${{ github.ref_name }}
+ git rebase origin/${{ github.ref_name }}
+ if git push origin ${{ github.ref_name }}:${{ github.ref_name }}; then
+ echo "Push successful."
+ exit 0
+ else
+ echo "Push failed, retrying in 3 seconds..."
+ sleep 3
+ fi
+ done
+ echo "Error: Failed to push after 5 attempts."
+ exit 1
- name: Upload benchmark results
uses: actions/upload-artifact@v4
with:
name: benchmark-results-${{ inputs.jdk }}-${{ inputs.scala }}-${{ matrix.split }}
- path: benchmark-results-${{ inputs.jdk }}-${{ inputs.scala }}.tar
+ path: target/benchmark-results-${{ inputs.jdk }}-${{ inputs.scala }}.tar
diff --git a/.github/workflows/build_and_test.yml b/.github/workflows/build_and_test.yml
index ff005103a2461..5e6d22256e2f3 100644
--- a/.github/workflows/build_and_test.yml
+++ b/.github/workflows/build_and_test.yml
@@ -112,7 +112,7 @@ jobs:
ui=false
docs=false
fi
- build=`./dev/is-changed.py -m "core,unsafe,kvstore,avro,utils,network-common,network-shuffle,repl,launcher,examples,sketch,variant,api,catalyst,hive-thriftserver,mllib-local,mllib,graphx,streaming,sql-kafka-0-10,streaming-kafka-0-10,streaming-kinesis-asl,kubernetes,hadoop-cloud,spark-ganglia-lgpl,profiler,protobuf,yarn,connect,sql,hive,pipelines"`
+ build=`./dev/is-changed.py -m "core,unsafe,kvstore,avro,utils,utils-java,network-common,network-shuffle,repl,launcher,examples,sketch,variant,api,catalyst,hive-thriftserver,mllib-local,mllib,graphx,streaming,sql-kafka-0-10,streaming-kafka-0-10,streaming-kinesis-asl,kubernetes,hadoop-cloud,spark-ganglia-lgpl,profiler,protobuf,yarn,connect,sql,hive,pipelines"`
precondition="
{
\"build\": \"$build\",
@@ -122,6 +122,8 @@ jobs:
\"tpcds-1g\": \"$tpcds\",
\"docker-integration-tests\": \"$docker\",
\"lint\" : \"true\",
+ \"java17\" : \"$build\",
+ \"java25\" : \"$build\",
\"docs\" : \"$docs\",
\"yarn\" : \"$yarn\",
\"k8s-integration-tests\" : \"$kubernetes\",
@@ -240,7 +242,7 @@ jobs:
# Note that the modules below are from sparktestsupport/modules.py.
modules:
- >-
- core, unsafe, kvstore, avro, utils,
+ core, unsafe, kvstore, avro, utils, utils-java,
network-common, network-shuffle, repl, launcher,
examples, sketch, variant
- >-
@@ -360,7 +362,7 @@ jobs:
- name: Install Python packages (Python 3.11)
if: (contains(matrix.modules, 'sql') && !contains(matrix.modules, 'sql-')) || contains(matrix.modules, 'connect') || contains(matrix.modules, 'yarn')
run: |
- python3.11 -m pip install 'numpy>=1.20.0' pyarrow pandas scipy unittest-xml-reporting 'lxml==4.9.4' 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1'
+ python3.11 -m pip install 'numpy>=1.22' pyarrow pandas scipy unittest-xml-reporting 'lxml==4.9.4' 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1'
python3.11 -m pip list
# Run the tests.
- name: Run tests
@@ -519,13 +521,9 @@ jobs:
- >-
pyspark-pandas-slow
- >-
- pyspark-pandas-connect-part0
+ pyspark-pandas-connect-part0, pyspark-pandas-connect-part3
- >-
- pyspark-pandas-connect-part1
- - >-
- pyspark-pandas-connect-part2
- - >-
- pyspark-pandas-connect-part3
+ pyspark-pandas-connect-part1, pyspark-pandas-connect-part2
exclude:
# Always run if pyspark == 'true', even infra-image is skip (such as non-master job)
# In practice, the build will run in individual PR, but not against the individual commit
@@ -605,8 +603,9 @@ jobs:
run: |
for py in $(echo $PYTHON_TO_TEST | tr "," "\n")
do
- echo $py
+ $py --version
$py -m pip list
+ echo ""
done
- name: Install Conda for pip packaging test
if: contains(matrix.modules, 'pyspark-errors')
@@ -919,6 +918,42 @@ jobs:
- name: R linter
run: ./dev/lint-r
+ java17:
+ needs: [precondition]
+ if: fromJson(needs.precondition.outputs.required).java17 == 'true'
+ name: Java 17 build with Maven
+ runs-on: ubuntu-latest
+ timeout-minutes: 120
+ steps:
+ - uses: actions/checkout@v4
+ - uses: actions/setup-java@v4
+ with:
+ distribution: zulu
+ java-version: 17
+ - name: Build with Maven
+ run: |
+ export MAVEN_OPTS="-Xss64m -Xmx4g -Xms4g -XX:ReservedCodeCacheSize=128m -Dorg.slf4j.simpleLogger.defaultLogLevel=WARN"
+ export MAVEN_CLI_OPTS="--no-transfer-progress"
+ ./build/mvn $MAVEN_CLI_OPTS -DskipTests -Pyarn -Pkubernetes -Pvolcano -Phive -Phive-thriftserver -Phadoop-cloud -Pjvm-profiler -Pspark-ganglia-lgpl -Pkinesis-asl clean install
+
+ java25:
+ needs: [precondition]
+ if: fromJson(needs.precondition.outputs.required).java25 == 'true'
+ name: Java 25 build with Maven
+ runs-on: ubuntu-latest
+ timeout-minutes: 120
+ steps:
+ - uses: actions/checkout@v4
+ - uses: actions/setup-java@v4
+ with:
+ distribution: zulu
+ java-version: 25-ea
+ - name: Build with Maven
+ run: |
+ export MAVEN_OPTS="-Xss64m -Xmx4g -Xms4g -XX:ReservedCodeCacheSize=128m -Dorg.slf4j.simpleLogger.defaultLogLevel=WARN"
+ export MAVEN_CLI_OPTS="--no-transfer-progress"
+ ./build/mvn $MAVEN_CLI_OPTS -DskipTests -Pyarn -Pkubernetes -Pvolcano -Phive -Phive-thriftserver -Phadoop-cloud -Pjvm-profiler -Pspark-ganglia-lgpl -Pkinesis-asl clean install
+
# Documentation build
docs:
needs: [precondition, infra-image]
@@ -998,10 +1033,14 @@ jobs:
# Should unpin 'sphinxcontrib-*' after upgrading sphinx>5
python3.9 -m pip install 'sphinx==4.5.0' mkdocs 'pydata_sphinx_theme>=0.13' sphinx-copybutton nbsphinx numpydoc jinja2 markupsafe 'pyzmq<24.0.0' 'sphinxcontrib-applehelp==1.0.4' 'sphinxcontrib-devhelp==1.0.2' 'sphinxcontrib-htmlhelp==2.0.1' 'sphinxcontrib-qthelp==1.0.3' 'sphinxcontrib-serializinghtml==1.1.5'
python3.9 -m pip install ipython_genutils # See SPARK-38517
- python3.9 -m pip install sphinx_plotly_directive 'numpy>=1.20.0' pyarrow pandas 'plotly<6.0.0'
+ python3.9 -m pip install sphinx_plotly_directive 'numpy>=1.22' pyarrow pandas 'plotly<6.0.0'
python3.9 -m pip install 'docutils<0.18.0' # See SPARK-39421
- - name: List Python packages
+ - name: List Python packages for branch-3.5 and branch-4.0
+ if: inputs.branch == 'branch-3.5' || inputs.branch == 'branch-4.0'
run: python3.9 -m pip list
+ - name: List Python packages
+ if: inputs.branch != 'branch-3.5' && inputs.branch != 'branch-4.0'
+ run: python3.11 -m pip list
- name: Install dependencies for documentation generation
run: |
# Keep the version of Bundler here in sync with the following locations:
@@ -1010,7 +1049,8 @@ jobs:
gem install bundler -v 2.4.22
cd docs
bundle install --retry=100
- - name: Run documentation build
+ - name: Run documentation build for branch-3.5 and branch-4.0
+ if: inputs.branch == 'branch-3.5' || inputs.branch == 'branch-4.0'
run: |
# We need this link to make sure `python3` points to `python3.9` which contains the prerequisite packages.
ln -s "$(which python3.9)" "/usr/local/bin/python3"
@@ -1031,6 +1071,30 @@ jobs:
echo "SKIP_SQLDOC: $SKIP_SQLDOC"
cd docs
bundle exec jekyll build
+ - name: Run documentation build
+ if: inputs.branch != 'branch-3.5' && inputs.branch != 'branch-4.0'
+ run: |
+ # We need this link to make sure `python3` points to `python3.11` which contains the prerequisite packages.
+ ln -s "$(which python3.11)" "/usr/local/bin/python3"
+ # Build docs first with SKIP_API to ensure they are buildable without requiring any
+ # language docs to be built beforehand.
+ cd docs; SKIP_ERRORDOC=1 SKIP_API=1 bundle exec jekyll build; cd ..
+ if [ -f "./dev/is-changed.py" ]; then
+ # Skip PySpark and SparkR docs while keeping Scala/Java/SQL docs
+ pyspark_modules=`cd dev && python3.11 -c "import sparktestsupport.modules as m; print(','.join(m.name for m in m.all_modules if m.name.startswith('pyspark')))"`
+ if [ `./dev/is-changed.py -m $pyspark_modules` = false ]; then export SKIP_PYTHONDOC=1; fi
+ if [ `./dev/is-changed.py -m sparkr` = false ]; then export SKIP_RDOC=1; fi
+ fi
+ export PYSPARK_DRIVER_PYTHON=python3.11
+ export PYSPARK_PYTHON=python3.11
+ # Print the values of environment variables `SKIP_ERRORDOC`, `SKIP_SCALADOC`, `SKIP_PYTHONDOC`, `SKIP_RDOC` and `SKIP_SQLDOC`
+ echo "SKIP_ERRORDOC: $SKIP_ERRORDOC"
+ echo "SKIP_SCALADOC: $SKIP_SCALADOC"
+ echo "SKIP_PYTHONDOC: $SKIP_PYTHONDOC"
+ echo "SKIP_RDOC: $SKIP_RDOC"
+ echo "SKIP_SQLDOC: $SKIP_SQLDOC"
+ cd docs
+ bundle exec jekyll build
- name: Tar documentation
if: github.repository != 'apache/spark'
run: tar cjf site.tar.bz2 docs/_site
@@ -1279,8 +1343,10 @@ jobs:
kubectl create clusterrolebinding serviceaccounts-cluster-admin --clusterrole=cluster-admin --group=system:serviceaccounts || true
if [[ "${{ inputs.branch }}" == 'branch-3.5' ]]; then
kubectl apply -f https://raw.githubusercontent.com/volcano-sh/volcano/v1.7.0/installer/volcano-development.yaml || true
- else
+ elif [[ "${{ inputs.branch }}" == 'branch-4.0' ]]; then
kubectl apply -f https://raw.githubusercontent.com/volcano-sh/volcano/v1.11.0/installer/volcano-development.yaml || true
+ else
+ kubectl apply -f https://raw.githubusercontent.com/volcano-sh/volcano/v1.12.2/installer/volcano-development.yaml || true
fi
eval $(minikube docker-env)
build/sbt -Phadoop-3 -Psparkr -Pkubernetes -Pvolcano -Pkubernetes-integration-tests -Dspark.kubernetes.test.volcanoMaxConcurrencyJobNum=1 -Dtest.exclude.tags=local "kubernetes-integration-tests/test"
diff --git a/.github/workflows/build_infra_images_cache.yml b/.github/workflows/build_infra_images_cache.yml
index ccd47826ff099..9ec93a4af52c1 100644
--- a/.github/workflows/build_infra_images_cache.yml
+++ b/.github/workflows/build_infra_images_cache.yml
@@ -33,7 +33,6 @@ on:
- 'dev/spark-test-image/python-minimum/Dockerfile'
- 'dev/spark-test-image/python-ps-minimum/Dockerfile'
- 'dev/spark-test-image/pypy-310/Dockerfile'
- - 'dev/spark-test-image/python-309/Dockerfile'
- 'dev/spark-test-image/python-310/Dockerfile'
- 'dev/spark-test-image/python-311/Dockerfile'
- 'dev/spark-test-image/python-311-classic-only/Dockerfile'
@@ -153,19 +152,6 @@ jobs:
- name: Image digest (PySpark with PyPy 3.10)
if: hashFiles('dev/spark-test-image/pypy-310/Dockerfile') != ''
run: echo ${{ steps.docker_build_pyspark_pypy_310.outputs.digest }}
- - name: Build and push (PySpark with Python 3.9)
- if: hashFiles('dev/spark-test-image/python-309/Dockerfile') != ''
- id: docker_build_pyspark_python_309
- uses: docker/build-push-action@v6
- with:
- context: ./dev/spark-test-image/python-309/
- push: true
- tags: ghcr.io/apache/spark/apache-spark-github-action-image-pyspark-python-309-cache:${{ github.ref_name }}-static
- cache-from: type=registry,ref=ghcr.io/apache/spark/apache-spark-github-action-image-pyspark-python-309-cache:${{ github.ref_name }}
- cache-to: type=registry,ref=ghcr.io/apache/spark/apache-spark-github-action-image-pyspark-python-309-cache:${{ github.ref_name }},mode=max
- - name: Image digest (PySpark with Python 3.9)
- if: hashFiles('dev/spark-test-image/python-309/Dockerfile') != ''
- run: echo ${{ steps.docker_build_pyspark_python_309.outputs.digest }}
- name: Build and push (PySpark with Python 3.10)
if: hashFiles('dev/spark-test-image/python-310/Dockerfile') != ''
id: docker_build_pyspark_python_310
diff --git a/.github/workflows/build_maven_java21_arm.yml b/.github/workflows/build_maven_java21_arm.yml
index 505bdd63189c0..16417bb1c5f22 100644
--- a/.github/workflows/build_maven_java21_arm.yml
+++ b/.github/workflows/build_maven_java21_arm.yml
@@ -21,7 +21,7 @@ name: "Build / Maven (master, Scala 2.13, Hadoop 3, JDK 21, ARM)"
on:
schedule:
- - cron: '0 15 * * *'
+ - cron: '0 15 */2 * *'
workflow_dispatch:
jobs:
diff --git a/.github/workflows/build_non_ansi.yml b/.github/workflows/build_non_ansi.yml
index 547a227e61d7e..debdaf4f8709d 100644
--- a/.github/workflows/build_non_ansi.yml
+++ b/.github/workflows/build_non_ansi.yml
@@ -40,6 +40,7 @@ jobs:
"PYSPARK_IMAGE_TO_TEST": "python-311",
"PYTHON_TO_TEST": "python3.11",
"SPARK_ANSI_SQL_MODE": "false",
+ "SPARK_TEST_SPARK_BLOOM_FILTER_SUITE_ENABLED": "true"
}
jobs: >-
{
diff --git a/.github/workflows/build_python_3.9.yml b/.github/workflows/build_python_3.9.yml
deleted file mode 100644
index 0df17699140ed..0000000000000
--- a/.github/workflows/build_python_3.9.yml
+++ /dev/null
@@ -1,47 +0,0 @@
-#
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements. See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership. The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License. You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied. See the License for the
-# specific language governing permissions and limitations
-# under the License.
-#
-
-name: "Build / Python-only (master, Python 3.9)"
-
-on:
- schedule:
- - cron: '0 21 * * *'
- workflow_dispatch:
-
-jobs:
- run-build:
- permissions:
- packages: write
- name: Run
- uses: ./.github/workflows/build_and_test.yml
- if: github.repository == 'apache/spark'
- with:
- java: 17
- branch: master
- hadoop: hadoop3
- envs: >-
- {
- "PYSPARK_IMAGE_TO_TEST": "python-309",
- "PYTHON_TO_TEST": "python3.9"
- }
- jobs: >-
- {
- "pyspark": "true",
- "pyspark-pandas": "true"
- }
diff --git a/.github/workflows/build_python_connect.yml b/.github/workflows/build_python_connect.yml
index 8d82ff192ab07..bf247db613dba 100644
--- a/.github/workflows/build_python_connect.yml
+++ b/.github/workflows/build_python_connect.yml
@@ -72,7 +72,7 @@ jobs:
python packaging/client/setup.py sdist
cd dist
pip install pyspark*client-*.tar.gz
- pip install 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1' 'googleapis-common-protos==1.65.0' 'graphviz==0.20.3' 'six==1.16.0' 'pandas==2.2.3' scipy 'plotly<6.0.0' 'mlflow>=2.8.1' coverage matplotlib openpyxl 'memory-profiler>=0.61.0' 'scikit-learn>=1.3.2' 'graphviz==0.20.3' 'torch<2.6.0' torchvision torcheval deepspeed unittest-xml-reporting
+ pip install 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1' 'googleapis-common-protos==1.65.0' 'graphviz==0.20.3' 'six==1.16.0' 'pandas==2.3.2' scipy 'plotly<6.0.0' 'mlflow>=2.8.1' coverage matplotlib openpyxl 'memory-profiler>=0.61.0' 'scikit-learn>=1.3.2' 'graphviz==0.20.3' 'torch<2.6.0' torchvision torcheval deepspeed unittest-xml-reporting
- name: List Python packages
run: python -m pip list
- name: Run tests (local)
diff --git a/.github/workflows/build_python_connect35.yml b/.github/workflows/build_python_connect35.yml
index e68f288f0184f..6c37091afcb4f 100644
--- a/.github/workflows/build_python_connect35.yml
+++ b/.github/workflows/build_python_connect35.yml
@@ -68,7 +68,7 @@ jobs:
./build/sbt -Phive Test/package
- name: Install Python dependencies
run: |
- pip install 'numpy==1.25.1' 'pyarrow==12.0.1' 'pandas<=2.0.3' scipy unittest-xml-reporting 'plotly<6.0.0' 'mlflow>=2.3.1' coverage 'matplotlib==3.7.2' openpyxl 'memory-profiler==0.60.0' 'scikit-learn==1.1.*'
+ pip install 'numpy==1.25.1' 'pyarrow>=18.0.0' 'pandas<=2.0.3' scipy unittest-xml-reporting 'plotly<6.0.0' 'mlflow>=2.3.1' coverage 'matplotlib==3.7.2' openpyxl 'memory-profiler==0.60.0' 'scikit-learn==1.1.*'
# Add Python deps for Spark Connect.
pip install 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1' 'googleapis-common-protos==1.65.0' 'graphviz==0.20.3'
diff --git a/.github/workflows/build_python_minimum.yml b/.github/workflows/build_python_minimum.yml
index 4e65503006489..3514a82f6217c 100644
--- a/.github/workflows/build_python_minimum.yml
+++ b/.github/workflows/build_python_minimum.yml
@@ -38,7 +38,7 @@ jobs:
envs: >-
{
"PYSPARK_IMAGE_TO_TEST": "python-minimum",
- "PYTHON_TO_TEST": "python3.9"
+ "PYTHON_TO_TEST": "python3.10"
}
jobs: >-
{
diff --git a/.github/workflows/build_python_ps_minimum.yml b/.github/workflows/build_python_ps_minimum.yml
index 3aa83ff06a996..ed80a904ebd7f 100644
--- a/.github/workflows/build_python_ps_minimum.yml
+++ b/.github/workflows/build_python_ps_minimum.yml
@@ -38,7 +38,7 @@ jobs:
envs: >-
{
"PYSPARK_IMAGE_TO_TEST": "python-ps-minimum",
- "PYTHON_TO_TEST": "python3.9"
+ "PYTHON_TO_TEST": "python3.10"
}
jobs: >-
{
diff --git a/.github/workflows/build_sparkr_window.yml b/.github/workflows/build_sparkr_window.yml
index e3ef9d7ba0752..8bbcdf79bd58b 100644
--- a/.github/workflows/build_sparkr_window.yml
+++ b/.github/workflows/build_sparkr_window.yml
@@ -16,7 +16,7 @@
# specific language governing permissions and limitations
# under the License.
#
-name: "Build / SparkR-only (master, 4.4.3, windows-2022)"
+name: "Build / SparkR-only (master, 4.4.3, windows-2025)"
on:
schedule:
@@ -26,7 +26,7 @@ on:
jobs:
build:
name: "Build module: sparkr"
- runs-on: windows-2022
+ runs-on: windows-2025
timeout-minutes: 120
if: github.repository == 'apache/spark'
steps:
diff --git a/.github/workflows/maven_test.yml b/.github/workflows/maven_test.yml
index e0a5e411571a0..5b1d3b47858d6 100644
--- a/.github/workflows/maven_test.yml
+++ b/.github/workflows/maven_test.yml
@@ -67,7 +67,7 @@ jobs:
- hive2.3
modules:
- >-
- core,launcher,common#unsafe,common#kvstore,common#network-common,common#network-shuffle,common#sketch,common#utils,common#variant
+ core,launcher,common#unsafe,common#kvstore,common#network-common,common#network-shuffle,common#sketch,common#utils,common#utils-java,common#variant
- >-
graphx,streaming,hadoop-cloud
- >-
@@ -181,7 +181,7 @@ jobs:
- name: Install Python packages (Python 3.11)
if: contains(matrix.modules, 'resource-managers#yarn') || (contains(matrix.modules, 'sql#core')) || contains(matrix.modules, 'connect')
run: |
- python3.11 -m pip install 'numpy>=1.20.0' pyarrow pandas scipy unittest-xml-reporting 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1'
+ python3.11 -m pip install 'numpy>=1.22' pyarrow pandas scipy unittest-xml-reporting 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1'
python3.11 -m pip list
# Run the tests.
- name: Run tests
@@ -190,6 +190,7 @@ jobs:
export MAVEN_OPTS="-Xss64m -Xmx4g -Xms4g -XX:ReservedCodeCacheSize=128m -Dorg.slf4j.simpleLogger.defaultLogLevel=WARN"
export MAVEN_CLI_OPTS="--no-transfer-progress"
export JAVA_VERSION=${{ matrix.java }}
+ export INPUT_BRANCH=${{ inputs.branch }}
export ENABLE_KINESIS_TESTS=0
# Replace with the real module name, for example, connector#kafka-0-10 -> connector/kafka-0-10
export TEST_MODULES=`echo "$MODULES_TO_TEST" | sed -e "s%#%/%g"`
@@ -209,6 +210,14 @@ jobs:
elif [[ "$MODULES_TO_TEST" == *"sql#hive-thriftserver"* ]]; then
# To avoid a compilation loop, for the `sql/hive-thriftserver` module, run `clean install` instead
./build/mvn $MAVEN_CLI_OPTS -pl "$TEST_MODULES" -Pyarn -Pkubernetes -Pvolcano -Phive -Phive-thriftserver -Phadoop-cloud -Pjvm-profiler -Pspark-ganglia-lgpl -Pkinesis-asl -Djava.version=${JAVA_VERSION/-ea} clean install -fae
+ elif [[ "$MODULES_TO_TEST" == *"sql#pipelines"* && "$INPUT_BRANCH" == "branch-4.0" ]]; then
+ # SPARK-52441: Remove sql/pipelines from TEST_MODULES for branch-4.0, this branch can be deleted after the EOL of branch-4.0.
+ TEST_MODULES=${TEST_MODULES/,sql\/pipelines/}
+ ./build/mvn $MAVEN_CLI_OPTS -pl "$TEST_MODULES" -Pyarn -Pkubernetes -Pvolcano -Phive -Phive-thriftserver -Pspark-ganglia-lgpl -Phadoop-cloud -Pjvm-profiler -Pkinesis-asl -Djava.version=${JAVA_VERSION/-ea} test -fae
+ elif [[ "$MODULES_TO_TEST" == *"common#utils-java"* && "$INPUT_BRANCH" == "branch-4.0" ]]; then
+ # SPARK-53138: Remove common/utils-java from TEST_MODULES for branch-4.0, this branch can be deleted after the EOL of branch-4.0.
+ TEST_MODULES=${TEST_MODULES/,common\/utils-java/}
+ ./build/mvn $MAVEN_CLI_OPTS -pl "$TEST_MODULES" -Pyarn -Pkubernetes -Pvolcano -Phive -Phive-thriftserver -Pspark-ganglia-lgpl -Phadoop-cloud -Pjvm-profiler -Pkinesis-asl -Djava.version=${JAVA_VERSION/-ea} test -fae
else
./build/mvn $MAVEN_CLI_OPTS -pl "$TEST_MODULES" -Pyarn -Pkubernetes -Pvolcano -Phive -Phive-thriftserver -Pspark-ganglia-lgpl -Phadoop-cloud -Pjvm-profiler -Pkinesis-asl -Djava.version=${JAVA_VERSION/-ea} test -fae
fi
diff --git a/.github/workflows/pages.yml b/.github/workflows/pages.yml
index 4bcc275064d3c..8293c2429c9d1 100644
--- a/.github/workflows/pages.yml
+++ b/.github/workflows/pages.yml
@@ -52,16 +52,16 @@ jobs:
with:
distribution: zulu
java-version: 17
- - name: Install Python 3.9
+ - name: Install Python 3.11
uses: actions/setup-python@v5
with:
- python-version: '3.9'
+ python-version: '3.11'
architecture: x64
cache: 'pip'
- name: Install Python dependencies
run: |
pip install 'sphinx==4.5.0' mkdocs 'pydata_sphinx_theme>=0.13' sphinx-copybutton nbsphinx numpydoc jinja2 markupsafe 'pyzmq<24.0.0' \
- ipython ipython_genutils sphinx_plotly_directive 'numpy>=1.20.0' pyarrow 'pandas==2.2.3' 'plotly>=4.8' 'docutils<0.18.0' \
+ ipython ipython_genutils sphinx_plotly_directive 'numpy>=1.22' pyarrow 'pandas==2.3.2' 'plotly>=4.8' 'docutils<0.18.0' \
'flake8==3.9.0' 'mypy==1.8.0' 'pytest==7.1.3' 'pytest-mypy-plugins==1.9.3' 'black==23.12.1' \
'pandas-stubs==1.2.0.53' 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1' 'grpc-stubs==1.24.11' 'googleapis-common-protos-stubs==2.2.0' \
'sphinxcontrib-applehelp==1.0.4' 'sphinxcontrib-devhelp==1.0.2' 'sphinxcontrib-htmlhelp==2.0.1' 'sphinxcontrib-qthelp==1.0.3' 'sphinxcontrib-serializinghtml==1.1.5'
diff --git a/.github/workflows/python_hosted_runner_test.yml b/.github/workflows/python_hosted_runner_test.yml
index 9a87c4f7061b0..afc016186be52 100644
--- a/.github/workflows/python_hosted_runner_test.yml
+++ b/.github/workflows/python_hosted_runner_test.yml
@@ -149,7 +149,7 @@ jobs:
run: |
python${{matrix.python}} -m pip install --ignore-installed 'blinker>=1.6.2'
python${{matrix.python}} -m pip install --ignore-installed 'six==1.16.0'
- python${{matrix.python}} -m pip install numpy 'pyarrow>=19.0.0' 'six==1.16.0' 'pandas==2.2.3' scipy 'plotly<6.0.0' 'mlflow>=2.8.1' coverage matplotlib openpyxl 'memory-profiler>=0.61.0' 'scikit-learn>=1.3.2' unittest-xml-reporting && \
+ python${{matrix.python}} -m pip install numpy 'pyarrow>=21.0.0' 'six==1.16.0' 'pandas==2.3.2' scipy 'plotly<6.0.0' 'mlflow>=2.8.1' coverage matplotlib openpyxl 'memory-profiler>=0.61.0' 'scikit-learn>=1.3.2' unittest-xml-reporting && \
python${{matrix.python}} -m pip install 'grpcio==1.67.0' 'grpcio-status==1.67.0' 'protobuf==5.29.1' 'googleapis-common-protos==1.65.0' 'graphviz==0.20.3' && \
python${{matrix.python}} -m pip cache purge
- name: List Python packages
diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
index 976aaf616295c..a6fa04b120de5 100644
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -74,7 +74,8 @@ on:
inputs:
branch:
description: 'Branch to release. Leave it empty to launch a dryrun. Dispatch this workflow only in the forked repository.'
- required: false
+ required: true
+ default: master
release-version:
description: 'Release version. Leave it empty to launch a dryrun.'
required: false
@@ -90,10 +91,23 @@ jobs:
release:
name: Release Apache Spark
runs-on: ubuntu-latest
- # Do not allow dispatching this workflow manually in the main repo.
- # and skip this workflow in forked repository when running as a
- # scheduled job (dryrun).
- if: ${{ (github.repository == 'apache/spark') != (inputs.branch != '' && inputs.release-version != '') }}
+ # Allow workflow to run only in the following cases:
+ # 1. In the apache/spark repository:
+ # - Only allow dry runs (i.e., both 'branch' and 'release-version' inputs are empty).
+ # 2. In forked repositories:
+ # - Allow real runs when both 'branch' and 'release-version' are provided.
+ # - Allow dry runs only if manually dispatched (not on a schedule).
+ if: |
+ (
+ github.repository == 'apache/spark' &&
+ inputs.branch == '' &&
+ inputs.release-version == ''
+ ) || (
+ github.repository != 'apache/spark' &&
+ (
+ (inputs.branch != '' && inputs.release-version != '') || github.event_name == 'workflow_dispatch'
+ )
+ )
steps:
- name: Checkout Spark repository
uses: actions/checkout@v4
@@ -132,22 +146,12 @@ jobs:
sleep 60
fi
- empty_count=0
- non_empty_count=0
- for val in "$GIT_BRANCH" "$RELEASE_VERSION" "$SPARK_RC_COUNT"; do
- if [ -z "$val" ]; then
- empty_count=$((empty_count+1))
- else
- non_empty_count=$((non_empty_count+1))
- fi
- done
-
- if [ "$empty_count" -gt 0 ] && [ "$non_empty_count" -gt 0 ]; then
- echo "Error: Either provide all inputs or leave them all empty for a dryrun."
+ if { [ -n "$RELEASE_VERSION" ] && [ -z "$SPARK_RC_COUNT" ]; } || { [ -z "$RELEASE_VERSION" ] && [ -n "$SPARK_RC_COUNT" ]; }; then
+ echo "Error: Either provide both 'Release version' and 'RC number', or leave both empty for a dryrun."
exit 1
fi
- if [ "$empty_count" -eq 3 ]; then
+ if [ -z "$RELEASE_VERSION" ] && [ -z "$SPARK_RC_COUNT" ]; then
echo "Dry run mode enabled"
export DRYRUN_MODE=1
ASF_PASSWORD="not_used"
@@ -155,7 +159,6 @@ jobs:
GPG_PASSPHRASE="not_used"
ASF_USERNAME="gurwls223"
export SKIP_TAG=1
- unset GIT_BRANCH
unset RELEASE_VERSION
else
echo "Full release mode enabled"
@@ -163,7 +166,7 @@ jobs:
fi
export ASF_PASSWORD GPG_PRIVATE_KEY GPG_PASSPHRASE ASF_USERNAME
- [ -n "$GIT_BRANCH" ] && export GIT_BRANCH
+ export GIT_BRANCH="${GIT_BRANCH:-master}"
[ -n "$RELEASE_VERSION" ] && export RELEASE_VERSION
if [ "$DRYRUN_MODE" = "1" ]; then
@@ -237,9 +240,18 @@ jobs:
cp "$file" "$file.bak"
for pattern in "${PATTERNS[@]}"; do
[ -n "$pattern" ] || continue # Skip empty patterns
- escaped_pattern=$(printf '%s\n' "$pattern" | sed 's/[\/&]/\\&/g')
- sed -i "s/${escaped_pattern}/***/g" "$file"
+
+ # Safely escape special characters for sed
+ escaped_pattern=${pattern//\\/\\\\} # Escape backslashes
+ escaped_pattern=${escaped_pattern//\//\\/} # Escape forward slashes
+ escaped_pattern=${escaped_pattern//&/\\&} # Escape &
+ escaped_pattern=${escaped_pattern//$'\n'/} # Remove newlines
+ escaped_pattern=${escaped_pattern//$'\r'/} # Remove carriage returns (optional)
+
+ # Redact the pattern
+ sed -i.bak "s/${escaped_pattern}/***/g" "$file"
done
+ rm -f "$file.bak"
done
# Zip logs/output
diff --git a/.gitignore b/.gitignore
index b6a1e63c41920..bbf02496498c1 100644
--- a/.gitignore
+++ b/.gitignore
@@ -125,3 +125,7 @@ sql/api/gen/
sql/api/src/main/gen/
sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseLexer.tokens
sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/gen/
+
+tpcds-sf-1/
+tpcds-sf-1-text/
+tpcds-kit/
diff --git a/connect-examples/server-library-example/client/src/main/resources/log4j2.xml b/.mvn/extensions.xml
similarity index 72%
rename from connect-examples/server-library-example/client/src/main/resources/log4j2.xml
rename to .mvn/extensions.xml
index 21b0d9719193e..da2aee8827a54 100644
--- a/connect-examples/server-library-example/client/src/main/resources/log4j2.xml
+++ b/.mvn/extensions.xml
@@ -15,16 +15,10 @@
~ See the License for the specific language governing permissions and
~ limitations under the License.
-->
-
-
-
-
-
-
-
-
-
-
-
-
-
+<extensions>
+  <extension>
+    <groupId>eu.maveniverse.maven.nisse</groupId>
+    <artifactId>extension</artifactId>
+    <version>0.4.6</version>
+  </extension>
+</extensions>
diff --git a/.mvn/jvm.config b/.mvn/jvm.config
index 81b88d8173419..b41dca0e56a6b 100644
--- a/.mvn/jvm.config
+++ b/.mvn/jvm.config
@@ -1 +1,4 @@
+-XX:+IgnoreUnrecognizedVMOptions
+-XX:+UnlockDiagnosticVMOptions
+-XX:GCLockerRetryAllocationCount=100
--enable-native-access=ALL-UNNAMED
diff --git a/.mvn/maven.config b/.mvn/maven.config
new file mode 100644
index 0000000000000..e61f1a94abdef
--- /dev/null
+++ b/.mvn/maven.config
@@ -0,0 +1 @@
+-Dnisse.compat.osDetector
diff --git a/LICENSE b/LICENSE
index 9b1e96a44a58c..ef8192ec38d05 100644
--- a/LICENSE
+++ b/LICENSE
@@ -217,6 +217,7 @@ core/src/main/resources/org/apache/spark/ui/static/vis*
connector/spark-ganglia-lgpl/src/main/java/com/codahale/metrics/ganglia/GangliaReporter.java
core/src/main/resources/org/apache/spark/ui/static/d3-flamegraph.min.js
core/src/main/resources/org/apache/spark/ui/static/d3-flamegraph.css
+mllib-local/src/main/scala/scala/collection/compat/package.scala
Python Software Foundation License
----------------------------------
diff --git a/LICENSE-binary b/LICENSE-binary
index 0c3c7aecb71ac..6f6bf9db5448a 100644
--- a/LICENSE-binary
+++ b/LICENSE-binary
@@ -365,8 +365,6 @@ org.apache.xbean:xbean-asm9-shaded
org.apache.yetus:audience-annotations
org.apache.zookeeper:zookeeper
org.apache.zookeeper:zookeeper-jute
-org.codehaus.jackson:jackson-core-asl
-org.codehaus.jackson:jackson-mapper-asl
org.datanucleus:datanucleus-api-jdo
org.datanucleus:datanucleus-core
org.datanucleus:datanucleus-rdbms
@@ -388,7 +386,6 @@ org.glassfish.jersey.core:jersey-common
org.glassfish.jersey.core:jersey-server
org.glassfish.jersey.inject:jersey-hk2
org.javassist:javassist
-org.jetbrains:annotations
org.json4s:json4s-ast_2.13
org.json4s:json4s-core_2.13
org.json4s:json4s-jackson-core_2.13
@@ -401,7 +398,6 @@ org.rocksdb:rocksdbjni
org.scala-lang:scala-compiler
org.scala-lang:scala-library
org.scala-lang:scala-reflect
-org.scala-lang.modules:scala-collection-compat_2.13
org.scala-lang.modules:scala-parallel-collections_2.13
org.scala-lang.modules:scala-parser-combinators_2.13
org.scala-lang.modules:scala-xml_2.13
@@ -442,7 +438,6 @@ com.github.luben:zstd-jni
com.github.wendykierp:JTransforms
javolution:javolution
jline:jline
-org.jodd:jodd-core
pl.edu.icm:JLargeArrays
python/pyspark/errors/exceptions/tblib.py
@@ -465,6 +460,7 @@ org.codehaus.janino:janino
org.fusesource.leveldbjni:leveldbjni-all
org.jline:jline
org.jpmml:pmml-model
+org.locationtech.jts:jts-core
org.threeten:threeten-extra
python/lib/py4j-*-src.zip
diff --git a/README.md b/README.md
index 0f0bf039550d7..17344563d90ac 100644
--- a/README.md
+++ b/README.md
@@ -36,7 +36,6 @@ This README file only contains basic setup instructions.
| | [](https://github.com/apache/spark/actions/workflows/build_maven_java21_arm.yml) |
| | [](https://github.com/apache/spark/actions/workflows/build_coverage.yml) |
| | [](https://github.com/apache/spark/actions/workflows/build_python_pypy3.10.yml) |
-| | [](https://github.com/apache/spark/actions/workflows/build_python_3.9.yml) |
| | [](https://github.com/apache/spark/actions/workflows/build_python_3.10.yml) |
| | [](https://github.com/apache/spark/actions/workflows/build_python_3.11_classic_only.yml) |
| | [](https://github.com/apache/spark/actions/workflows/build_python_3.11_arm.yml) |
diff --git a/assembly/pom.xml b/assembly/pom.xml
index a85ac5d9bc837..3a6b73b4522db 100644
--- a/assembly/pom.xml
+++ b/assembly/pom.xml
@@ -306,13 +306,6 @@
       <properties>
         <hive.deps.scope>provided</hive.deps.scope>
-        <hive.jackson.scope>provided</hive.jackson.scope>
-      </properties>
-    </profile>
-    <profile>
-      <id>hive-jackson-provided</id>
-      <properties>
-        <hive.jackson.scope>provided</hive.jackson.scope>
       </properties>
     </profile>
diff --git a/bin/spark-pipelines b/bin/spark-pipelines
index 52baeeafab08a..2174df7bed699 100755
--- a/bin/spark-pipelines
+++ b/bin/spark-pipelines
@@ -30,4 +30,4 @@ fi
export PYTHONPATH="${SPARK_HOME}/python/:$PYTHONPATH"
export PYTHONPATH="${SPARK_HOME}/python/lib/py4j-0.10.9.9-src.zip:$PYTHONPATH"
-$PYSPARK_PYTHON "${SPARK_HOME}"/python/pyspark/pipelines/cli.py "$@"
+exec "${SPARK_HOME}"/bin/spark-class org.apache.spark.deploy.SparkPipelines "$@"
diff --git a/build/sbt b/build/sbt
index db9d3b345ff6f..7644c143ad423 100755
--- a/build/sbt
+++ b/build/sbt
@@ -36,7 +36,7 @@ fi
declare -r noshare_opts="-Dsbt.global.base=project/.sbtboot -Dsbt.boot.directory=project/.boot -Dsbt.ivy.home=project/.ivy"
declare -r sbt_opts_file=".sbtopts"
declare -r etc_sbt_opts_file="/etc/sbt/sbtopts"
-declare -r default_sbt_opts="-Xss64m"
+declare -r default_sbt_opts="-Xss64m -XX:+IgnoreUnrecognizedVMOptions -XX:+UnlockDiagnosticVMOptions -XX:GCLockerRetryAllocationCount=100"
usage() {
  cat <<EOM
       <artifactId>slf4j-api</artifactId>
     </dependency>
-    <dependency>
-      <groupId>commons-io</groupId>
-      <artifactId>commons-io</artifactId>
-      <scope>test</scope>
-    </dependency>
-    <dependency>
-      <groupId>org.apache.commons</groupId>
-      <artifactId>commons-lang3</artifactId>
-      <scope>test</scope>
-    </dependency>
     <dependency>
       <groupId>org.apache.logging.log4j</groupId>
       <artifactId>log4j-api</artifactId>
diff --git a/common/kvstore/src/main/java/org/apache/spark/util/kvstore/ArrayWrappers.java b/common/kvstore/src/main/java/org/apache/spark/util/kvstore/ArrayWrappers.java
index 5265881e990e9..a9d6784805f6d 100644
--- a/common/kvstore/src/main/java/org/apache/spark/util/kvstore/ArrayWrappers.java
+++ b/common/kvstore/src/main/java/org/apache/spark/util/kvstore/ArrayWrappers.java
@@ -19,7 +19,7 @@
import java.util.Arrays;
-import com.google.common.base.Preconditions;
+import org.apache.spark.network.util.JavaUtils;
/**
* A factory for array wrappers so that arrays can be used as keys in a map, sorted or not.
@@ -38,7 +38,7 @@ class ArrayWrappers {
@SuppressWarnings("unchecked")
   public static Comparable<Object> forArray(Object a) {
-    <dependency>
-      <groupId>org.apache.commons</groupId>
-      <artifactId>commons-lang3</artifactId>
-    </dependency>
     <dependency>
       <groupId>${leveldbjni.group}</groupId>
       <artifactId>leveldbjni-all</artifactId>
@@ -174,7 +170,7 @@
       <groupId>org.apache.spark</groupId>
-      <artifactId>spark-common-utils_${scala.binary.version}</artifactId>
+      <artifactId>spark-common-utils-java_${scala.binary.version}</artifactId>
       <version>${project.version}</version>
diff --git a/common/network-common/src/main/java/org/apache/spark/network/buffer/FileSegmentManagedBuffer.java b/common/network-common/src/main/java/org/apache/spark/network/buffer/FileSegmentManagedBuffer.java
index dd7c2061ec95b..eed43a8d28d90 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/buffer/FileSegmentManagedBuffer.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/buffer/FileSegmentManagedBuffer.java
@@ -26,11 +26,8 @@
import java.nio.channels.FileChannel;
import java.nio.file.StandardOpenOption;
-import com.google.common.io.ByteStreams;
import io.netty.channel.DefaultFileRegion;
import io.netty.handler.stream.ChunkedStream;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.LimitedInputStream;
@@ -100,7 +97,7 @@ public InputStream createInputStream() throws IOException {
boolean shouldClose = true;
try {
is = new FileInputStream(file);
- ByteStreams.skipFully(is, offset);
+ is.skipNBytes(offset);
InputStream r = new LimitedInputStream(is, length);
shouldClose = false;
return r;
@@ -152,10 +149,7 @@ public Object convertToNettyForSsl() throws IOException {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("file", file)
- .append("offset", offset)
- .append("length", length)
- .toString();
+ return "FileSegmentManagedBuffer[file=" + file + ",offset=" + offset +
+ ",length=" + length + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/buffer/NettyManagedBuffer.java b/common/network-common/src/main/java/org/apache/spark/network/buffer/NettyManagedBuffer.java
index a40cfc8bc04b1..e7b8bafa92f4b 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/buffer/NettyManagedBuffer.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/buffer/NettyManagedBuffer.java
@@ -23,8 +23,6 @@
import io.netty.buffer.ByteBuf;
import io.netty.buffer.ByteBufInputStream;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* A {@link ManagedBuffer} backed by a Netty {@link ByteBuf}.
@@ -75,8 +73,6 @@ public Object convertToNettyForSsl() throws IOException {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("buf", buf)
- .toString();
+ return "NettyManagedBuffer[buf=" + buf + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/buffer/NioManagedBuffer.java b/common/network-common/src/main/java/org/apache/spark/network/buffer/NioManagedBuffer.java
index 6eb8d4e2c731c..d97f853c58f1f 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/buffer/NioManagedBuffer.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/buffer/NioManagedBuffer.java
@@ -23,8 +23,6 @@
import io.netty.buffer.ByteBufInputStream;
import io.netty.buffer.Unpooled;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* A {@link ManagedBuffer} backed by {@link ByteBuffer}.
@@ -73,9 +71,7 @@ public Object convertToNettyForSsl() throws IOException {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("buf", buf)
- .toString();
+ return "NioManagedBuffer[buf=" + buf + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/client/TransportClient.java b/common/network-common/src/main/java/org/apache/spark/network/client/TransportClient.java
index a9df47645d36f..f02f2c63ecd4c 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/client/TransportClient.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/client/TransportClient.java
@@ -21,20 +21,17 @@
import java.io.IOException;
import java.net.SocketAddress;
import java.nio.ByteBuffer;
+import java.util.Objects;
import java.util.UUID;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.TimeUnit;
import javax.annotation.Nullable;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
-import com.google.common.base.Throwables;
import com.google.common.util.concurrent.SettableFuture;
import io.netty.channel.Channel;
import io.netty.util.concurrent.Future;
import io.netty.util.concurrent.GenericFutureListener;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -43,6 +40,7 @@
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NioManagedBuffer;
import org.apache.spark.network.protocol.*;
+import org.apache.spark.network.util.JavaUtils;
import static org.apache.spark.network.util.NettyUtils.getRemoteAddress;
@@ -81,8 +79,8 @@ public class TransportClient implements Closeable {
private volatile boolean timedOut;
public TransportClient(Channel channel, TransportResponseHandler handler) {
- this.channel = Preconditions.checkNotNull(channel);
- this.handler = Preconditions.checkNotNull(handler);
+ this.channel = Objects.requireNonNull(channel);
+ this.handler = Objects.requireNonNull(handler);
this.timedOut = false;
}
@@ -113,7 +111,7 @@ public String getClientId() {
* Trying to set a different client ID after it's been set will result in an exception.
*/
public void setClientId(String id) {
- Preconditions.checkState(clientId == null, "Client ID has already been set.");
+ JavaUtils.checkState(clientId == null, "Client ID has already been set.");
this.clientId = id;
}
@@ -290,10 +288,9 @@ public void onFailure(Throwable e) {
try {
return result.get(timeoutMs, TimeUnit.MILLISECONDS);
} catch (ExecutionException e) {
- Throwables.throwIfUnchecked(e.getCause());
throw new RuntimeException(e.getCause());
} catch (Exception e) {
- Throwables.throwIfUnchecked(e);
+ if (e instanceof RuntimeException re) throw re;
throw new RuntimeException(e);
}
}
@@ -338,11 +335,8 @@ public void close() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("remoteAddress", channel.remoteAddress())
- .append("clientId", clientId)
- .append("isActive", isActive())
- .toString();
+    return "TransportClient[remoteAddress=" + channel.remoteAddress() + ",clientId=" + clientId +
+ ",isActive=" + isActive() + "]";
}
private static long requestId() {
@@ -369,8 +363,8 @@ public void operationComplete(Future<? super Void> future) throws Exception {
}
} else {
logger.error("Failed to send RPC {} to {}", future.cause(),
- MDC.of(LogKeys.REQUEST_ID$.MODULE$, requestId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
+ MDC.of(LogKeys.REQUEST_ID, requestId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
channel.close();
try {
String errorMsg = String.format("Failed to send RPC %s to %s: %s", requestId,
diff --git a/common/network-common/src/main/java/org/apache/spark/network/client/TransportClientFactory.java b/common/network-common/src/main/java/org/apache/spark/network/client/TransportClientFactory.java
index d64b8c8f838e9..2137b5f3136ef 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/client/TransportClientFactory.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/client/TransportClientFactory.java
@@ -21,16 +21,15 @@
import java.io.IOException;
import java.net.InetSocketAddress;
import java.net.SocketAddress;
+import java.util.ArrayList;
import java.util.List;
+import java.util.Objects;
import java.util.Random;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.atomic.AtomicReference;
import com.codahale.metrics.MetricSet;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
-import com.google.common.base.Throwables;
-import com.google.common.collect.Lists;
import io.netty.bootstrap.Bootstrap;
import io.netty.buffer.PooledByteBufAllocator;
import io.netty.channel.Channel;
@@ -100,9 +99,9 @@ private static class ClientPool {
public TransportClientFactory(
TransportContext context,
       List<TransportClientBootstrap> clientBootstraps) {
- this.context = Preconditions.checkNotNull(context);
+ this.context = Objects.requireNonNull(context);
this.conf = context.getConf();
- this.clientBootstraps = Lists.newArrayList(Preconditions.checkNotNull(clientBootstraps));
+ this.clientBootstraps = new ArrayList<>(Objects.requireNonNull(clientBootstraps));
this.connectionPool = new ConcurrentHashMap<>();
this.numConnectionsPerPeer = conf.numConnectionsPerPeer();
this.rand = new Random();
@@ -193,9 +192,9 @@ public TransportClient createClient(String remoteHost, int remotePort, boolean f
final String resolvMsg = resolvedAddress.isUnresolved() ? "failed" : "succeed";
if (hostResolveTimeMs > 2000) {
logger.warn("DNS resolution {} for {} took {} ms",
- MDC.of(LogKeys.STATUS$.MODULE$, resolvMsg),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, resolvedAddress),
- MDC.of(LogKeys.TIME$.MODULE$, hostResolveTimeMs));
+ MDC.of(LogKeys.STATUS, resolvMsg),
+ MDC.of(LogKeys.HOST_PORT, resolvedAddress),
+ MDC.of(LogKeys.TIME, hostResolveTimeMs));
} else {
logger.trace("DNS resolution {} for {} took {} ms",
resolvMsg, resolvedAddress, hostResolveTimeMs);
@@ -210,7 +209,7 @@ public TransportClient createClient(String remoteHost, int remotePort, boolean f
return cachedClient;
} else {
logger.info("Found inactive connection to {}, creating a new one.",
- MDC.of(LogKeys.HOST_PORT$.MODULE$, resolvedAddress));
+ MDC.of(LogKeys.HOST_PORT, resolvedAddress));
}
}
// If this connection should fast fail when last connection failed in last fast fail time
@@ -314,7 +313,7 @@ public void operationComplete(final Future handshakeFuture) {
logger.debug("{} successfully completed TLS handshake to ", address);
} else {
logger.info("failed to complete TLS handshake to {}", handshakeFuture.cause(),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, address));
+ MDC.of(LogKeys.HOST_PORT, address));
cf.channel().close();
}
}
@@ -340,17 +339,17 @@ public void operationComplete(final Future handshakeFuture) {
} catch (Exception e) { // catch non-RuntimeExceptions too as bootstrap may be written in Scala
long bootstrapTimeMs = (System.nanoTime() - preBootstrap) / 1000000;
logger.error("Exception while bootstrapping client after {} ms", e,
- MDC.of(LogKeys.BOOTSTRAP_TIME$.MODULE$, bootstrapTimeMs));
+ MDC.of(LogKeys.BOOTSTRAP_TIME, bootstrapTimeMs));
client.close();
- Throwables.throwIfUnchecked(e);
+ if (e instanceof RuntimeException re) throw re;
throw new RuntimeException(e);
}
long postBootstrap = System.nanoTime();
logger.info("Successfully created connection to {} after {} ms ({} ms spent in bootstraps)",
- MDC.of(LogKeys.HOST_PORT$.MODULE$, address),
- MDC.of(LogKeys.ELAPSED_TIME$.MODULE$, (postBootstrap - preConnect) / 1000000),
- MDC.of(LogKeys.BOOTSTRAP_TIME$.MODULE$, (postBootstrap - preBootstrap) / 1000000));
+ MDC.of(LogKeys.HOST_PORT, address),
+ MDC.of(LogKeys.ELAPSED_TIME, (postBootstrap - preConnect) / 1000000),
+ MDC.of(LogKeys.BOOTSTRAP_TIME, (postBootstrap - preBootstrap) / 1000000));
return client;
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/client/TransportResponseHandler.java b/common/network-common/src/main/java/org/apache/spark/network/client/TransportResponseHandler.java
index be4cf4a58abeb..d27fa08d829bb 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/client/TransportResponseHandler.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/client/TransportResponseHandler.java
@@ -26,8 +26,6 @@
import com.google.common.annotations.VisibleForTesting;
import io.netty.channel.Channel;
-import org.apache.commons.lang3.tuple.ImmutablePair;
-import org.apache.commons.lang3.tuple.Pair;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -45,6 +43,7 @@
import org.apache.spark.network.server.MessageHandler;
import static org.apache.spark.network.util.NettyUtils.getRemoteAddress;
import org.apache.spark.network.util.TransportFrameDecoder;
+import org.apache.spark.util.Pair;
/**
* Handler that processes server responses, in response to requests issued from a
@@ -96,7 +95,7 @@ public void removeRpcRequest(long requestId) {
public void addStreamCallback(String streamId, StreamCallback callback) {
updateTimeOfLastRequest();
- streamCallbacks.offer(ImmutablePair.of(streamId, callback));
+ streamCallbacks.offer(Pair.of(streamId, callback));
}
@VisibleForTesting
@@ -125,7 +124,7 @@ private void failOutstandingRequests(Throwable cause) {
}
     for (Pair<String, StreamCallback> entry : streamCallbacks) {
try {
- entry.getValue().onFailure(entry.getKey(), cause);
+ entry.getRight().onFailure(entry.getLeft(), cause);
} catch (Exception e) {
logger.warn("StreamCallback.onFailure throws exception", e);
}
@@ -146,8 +145,8 @@ public void channelInactive() {
if (hasOutstandingRequests()) {
String remoteAddress = getRemoteAddress(channel);
logger.error("Still have {} requests outstanding when connection from {} is closed",
- MDC.of(LogKeys.COUNT$.MODULE$, numOutstandingRequests()),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, remoteAddress));
+ MDC.of(LogKeys.COUNT, numOutstandingRequests()),
+ MDC.of(LogKeys.HOST_PORT, remoteAddress));
failOutstandingRequests(new IOException("Connection from " + remoteAddress + " closed"));
}
}
@@ -157,8 +156,8 @@ public void exceptionCaught(Throwable cause) {
if (hasOutstandingRequests()) {
String remoteAddress = getRemoteAddress(channel);
logger.error("Still have {} requests outstanding when connection from {} is closed",
- MDC.of(LogKeys.COUNT$.MODULE$, numOutstandingRequests()),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, remoteAddress));
+ MDC.of(LogKeys.COUNT, numOutstandingRequests()),
+ MDC.of(LogKeys.HOST_PORT, remoteAddress));
failOutstandingRequests(cause);
}
}
@@ -169,8 +168,8 @@ public void handle(ResponseMessage message) throws Exception {
ChunkReceivedCallback listener = outstandingFetches.get(resp.streamChunkId);
if (listener == null) {
logger.warn("Ignoring response for block {} from {} since it is not outstanding",
- MDC.of(LogKeys.STREAM_CHUNK_ID$.MODULE$, resp.streamChunkId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
+ MDC.of(LogKeys.STREAM_CHUNK_ID, resp.streamChunkId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
resp.body().release();
} else {
outstandingFetches.remove(resp.streamChunkId);
@@ -181,9 +180,9 @@ public void handle(ResponseMessage message) throws Exception {
ChunkReceivedCallback listener = outstandingFetches.get(resp.streamChunkId);
if (listener == null) {
logger.warn("Ignoring response for block {} from {} ({}) since it is not outstanding",
- MDC.of(LogKeys.STREAM_CHUNK_ID$.MODULE$, resp.streamChunkId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)),
- MDC.of(LogKeys.ERROR$.MODULE$, resp.errorString));
+ MDC.of(LogKeys.STREAM_CHUNK_ID, resp.streamChunkId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)),
+ MDC.of(LogKeys.ERROR, resp.errorString));
} else {
outstandingFetches.remove(resp.streamChunkId);
listener.onFailure(resp.streamChunkId.chunkIndex(), new ChunkFetchFailureException(
@@ -193,9 +192,9 @@ public void handle(ResponseMessage message) throws Exception {
RpcResponseCallback listener = (RpcResponseCallback) outstandingRpcs.get(resp.requestId);
if (listener == null) {
logger.warn("Ignoring response for RPC {} from {} ({} bytes) since it is not outstanding",
- MDC.of(LogKeys.REQUEST_ID$.MODULE$, resp.requestId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)),
- MDC.of(LogKeys.RESPONSE_BODY_SIZE$.MODULE$, resp.body().size()));
+ MDC.of(LogKeys.REQUEST_ID, resp.requestId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)),
+ MDC.of(LogKeys.RESPONSE_BODY_SIZE, resp.body().size()));
resp.body().release();
} else {
outstandingRpcs.remove(resp.requestId);
@@ -209,9 +208,9 @@ public void handle(ResponseMessage message) throws Exception {
BaseResponseCallback listener = outstandingRpcs.get(resp.requestId);
if (listener == null) {
logger.warn("Ignoring response for RPC {} from {} ({}) since it is not outstanding",
- MDC.of(LogKeys.REQUEST_ID$.MODULE$, resp.requestId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)),
- MDC.of(LogKeys.ERROR$.MODULE$, resp.errorString));
+ MDC.of(LogKeys.REQUEST_ID, resp.requestId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)),
+ MDC.of(LogKeys.ERROR, resp.errorString));
} else {
outstandingRpcs.remove(resp.requestId);
listener.onFailure(new RuntimeException(resp.errorString));
@@ -223,9 +222,9 @@ public void handle(ResponseMessage message) throws Exception {
if (listener == null) {
logger.warn("Ignoring response for MergedBlockMetaRequest {} from {} ({} bytes) since "
+ "it is not outstanding",
- MDC.of(LogKeys.REQUEST_ID$.MODULE$, resp.requestId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)),
- MDC.of(LogKeys.RESPONSE_BODY_SIZE$.MODULE$, resp.body().size()));
+ MDC.of(LogKeys.REQUEST_ID, resp.requestId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)),
+ MDC.of(LogKeys.RESPONSE_BODY_SIZE, resp.body().size()));
} else {
outstandingRpcs.remove(resp.requestId);
listener.onSuccess(resp.getNumChunks(), resp.body());
@@ -236,7 +235,7 @@ public void handle(ResponseMessage message) throws Exception {
} else if (message instanceof StreamResponse resp) {
       Pair<String, StreamCallback> entry = streamCallbacks.poll();
if (entry != null) {
- StreamCallback callback = entry.getValue();
+ StreamCallback callback = entry.getRight();
if (resp.byteCount > 0) {
           StreamInterceptor<ResponseMessage> interceptor = new StreamInterceptor<>(
this, resp.streamId, resp.byteCount, callback);
@@ -262,7 +261,7 @@ public void handle(ResponseMessage message) throws Exception {
} else if (message instanceof StreamFailure resp) {
       Pair<String, StreamCallback> entry = streamCallbacks.poll();
if (entry != null) {
- StreamCallback callback = entry.getValue();
+ StreamCallback callback = entry.getRight();
try {
callback.onFailure(resp.streamId, new RuntimeException(resp.error));
} catch (IOException ioe) {
@@ -270,7 +269,7 @@ public void handle(ResponseMessage message) throws Exception {
}
} else {
logger.warn("Stream failure with unknown callback: {}",
- MDC.of(LogKeys.ERROR$.MODULE$, resp.error));
+ MDC.of(LogKeys.ERROR, resp.error));
}
} else {
throw new IllegalStateException("Unknown response type: " + message.type());
diff --git a/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthEngine.java b/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthEngine.java
index 8449a774a404a..f02fbc3aa26c7 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthEngine.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthEngine.java
@@ -21,10 +21,10 @@
import java.io.Closeable;
import java.security.GeneralSecurityException;
import java.util.Arrays;
+import java.util.Objects;
import java.util.Properties;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import com.google.common.primitives.Bytes;
import com.google.crypto.tink.subtle.AesGcmJce;
import com.google.crypto.tink.subtle.Hkdf;
@@ -33,6 +33,8 @@
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import static java.nio.charset.StandardCharsets.UTF_8;
+
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.TransportConf;
/**
@@ -61,10 +63,8 @@ class AuthEngine implements Closeable {
private TransportCipher sessionCipher;
AuthEngine(String appId, String preSharedSecret, TransportConf conf) {
- Preconditions.checkNotNull(appId);
- Preconditions.checkNotNull(preSharedSecret);
- this.appId = appId;
- this.preSharedSecret = preSharedSecret.getBytes(UTF_8);
+ this.appId = Objects.requireNonNull(appId);
+ this.preSharedSecret = Objects.requireNonNull(preSharedSecret).getBytes(UTF_8);
this.conf = conf;
this.cryptoConf = conf.cryptoConf();
// This is for backward compatibility with version 1.0 of this protocol,
@@ -126,7 +126,7 @@ private AuthMessage encryptEphemeralPublicKey(
private byte[] decryptEphemeralPublicKey(
AuthMessage encryptedPublicKey,
byte[] transcript) throws GeneralSecurityException {
- Preconditions.checkArgument(appId.equals(encryptedPublicKey.appId()));
+ JavaUtils.checkArgument(appId.equals(encryptedPublicKey.appId()), "appID is different.");
// Mix in the app ID, salt, and transcript into HKDF and use it as AES-GCM AAD
byte[] aadState = Bytes.concat(appId.getBytes(UTF_8), encryptedPublicKey.salt(), transcript);
// Use HKDF to derive an AES_GCM key from the pre-shared key, non-secret salt, and AAD state
@@ -162,7 +162,7 @@ AuthMessage challenge() throws GeneralSecurityException {
* @return An encrypted server ephemeral public key to be sent to the client.
*/
AuthMessage response(AuthMessage encryptedClientPublicKey) throws GeneralSecurityException {
- Preconditions.checkArgument(appId.equals(encryptedClientPublicKey.appId()));
+ JavaUtils.checkArgument(appId.equals(encryptedClientPublicKey.appId()), "appId is different.");
// Compute a shared secret given the client public key and the server private key
byte[] clientPublicKey =
decryptEphemeralPublicKey(encryptedClientPublicKey, EMPTY_TRANSCRIPT);
@@ -190,8 +190,7 @@ AuthMessage response(AuthMessage encryptedClientPublicKey) throws GeneralSecurit
*/
void deriveSessionCipher(AuthMessage encryptedClientPublicKey,
AuthMessage encryptedServerPublicKey) throws GeneralSecurityException {
- Preconditions.checkArgument(appId.equals(encryptedClientPublicKey.appId()));
- Preconditions.checkArgument(appId.equals(encryptedServerPublicKey.appId()));
+ JavaUtils.checkArgument(appId.equals(encryptedClientPublicKey.appId()), "appId is different.");
// Compute a shared secret given the server public key and the client private key,
// mixing in the protocol transcript.
byte[] serverPublicKey = decryptEphemeralPublicKey(
@@ -252,7 +251,7 @@ private byte[] getTranscript(AuthMessage... encryptedPublicKeys) {
}
TransportCipher sessionCipher() {
- Preconditions.checkState(sessionCipher != null);
+ JavaUtils.checkState(sessionCipher != null, "sessionCipher is null.");
return sessionCipher;
}
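Reviewer note: the recurring pattern in this file is Guava `Preconditions` calls replaced by `java.util.Objects.requireNonNull` and `JavaUtils.checkArgument`/`checkState`. A minimal sketch of that idiom, where the `JavaUtils` signatures are an assumption inferred from the call sites in this patch (boolean condition plus a `%s`-style message template), not the actual Spark implementation:

```java
import java.util.Objects;

// Minimal sketch of the Preconditions -> JDK/JavaUtils migration pattern used above.
// The real org.apache.spark.network.util.JavaUtils helpers are assumed to look roughly
// like the checkArgument/checkState below (inferred from the call sites in this patch).
final class PreconditionSketch {
  static void checkArgument(boolean expression, String message, Object... args) {
    if (!expression) throw new IllegalArgumentException(String.format(message, args));
  }

  static void checkState(boolean expression, String message, Object... args) {
    if (!expression) throw new IllegalStateException(String.format(message, args));
  }

  private final String appId;

  PreconditionSketch(String appId) {
    // Objects.requireNonNull throws NullPointerException, matching Preconditions.checkNotNull.
    this.appId = Objects.requireNonNull(appId, "appId must not be null");
  }
}
```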
diff --git a/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthRpcHandler.java b/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthRpcHandler.java
index 087e3d21e22bb..8ce4680f32437 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthRpcHandler.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/crypto/AuthRpcHandler.java
@@ -20,8 +20,6 @@
import java.nio.ByteBuffer;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
-import com.google.common.base.Throwables;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import io.netty.channel.Channel;
@@ -36,6 +34,7 @@
import org.apache.spark.network.sasl.SaslRpcHandler;
import org.apache.spark.network.server.AbstractAuthRpcHandler;
import org.apache.spark.network.server.RpcHandler;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.TransportConf;
/**
@@ -93,7 +92,7 @@ protected boolean doAuthChallenge(
} catch (RuntimeException e) {
if (conf.saslFallback()) {
LOG.warn("Failed to parse new auth challenge, reverting to SASL for client {}.",
- MDC.of(LogKeys.HOST_PORT$.MODULE$, channel.remoteAddress()));
+ MDC.of(LogKeys.HOST_PORT, channel.remoteAddress()));
saslHandler = new SaslRpcHandler(conf, channel, null, secretKeyHolder);
message.position(position);
message.limit(limit);
@@ -111,7 +110,7 @@ protected boolean doAuthChallenge(
AuthEngine engine = null;
try {
String secret = secretKeyHolder.getSecretKey(challenge.appId());
- Preconditions.checkState(secret != null,
+ JavaUtils.checkState(secret != null,
"Trying to authenticate non-registered app %s.", challenge.appId());
LOG.debug("Authenticating challenge for app {}.", challenge.appId());
engine = new AuthEngine(challenge.appId(), secret, conf);
@@ -132,7 +131,7 @@ protected boolean doAuthChallenge(
try {
engine.close();
} catch (Exception e) {
- Throwables.throwIfUnchecked(e);
+ if (e instanceof RuntimeException re) throw re;
throw new RuntimeException(e);
}
}
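Reviewer note: the `Throwables.throwIfUnchecked` replacement above uses Java 16+ pattern matching for `instanceof`. Guava's helper also rethrows `Error`, but that difference does not matter here because the enclosing `catch` only captures `Exception`. A standalone sketch of the idiom:

```java
// Sketch of the rethrow idiom used above: propagate unchecked exceptions unchanged,
// wrap checked ones in RuntimeException. Guava's Throwables.throwIfUnchecked also
// rethrows Error, but the enclosing catch block above only ever sees Exception.
final class RethrowSketch {
  static RuntimeException rethrow(Exception e) {
    if (e instanceof RuntimeException re) {
      throw re;                    // unchecked: rethrow as-is
    }
    throw new RuntimeException(e); // checked: wrap
  }
}
```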
diff --git a/common/network-common/src/main/java/org/apache/spark/network/crypto/CtrTransportCipher.java b/common/network-common/src/main/java/org/apache/spark/network/crypto/CtrTransportCipher.java
index 85b893751b39c..de7d1ae5753d9 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/crypto/CtrTransportCipher.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/crypto/CtrTransportCipher.java
@@ -27,7 +27,6 @@
import javax.crypto.spec.IvParameterSpec;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import io.netty.channel.*;
@@ -37,6 +36,7 @@
import org.apache.spark.network.util.AbstractFileRegion;
import org.apache.spark.network.util.ByteArrayReadableChannel;
import org.apache.spark.network.util.ByteArrayWritableChannel;
+import org.apache.spark.network.util.JavaUtils;
/**
* Cipher for encryption and decryption.
@@ -239,7 +239,7 @@ static class EncryptedMessage extends AbstractFileRegion {
Object msg,
ByteArrayWritableChannel byteEncChannel,
ByteArrayWritableChannel byteRawChannel) {
- Preconditions.checkArgument(msg instanceof ByteBuf || msg instanceof FileRegion,
+ JavaUtils.checkArgument(msg instanceof ByteBuf || msg instanceof FileRegion,
"Unrecognized message type: %s", msg.getClass().getName());
this.handler = handler;
this.isByteBuf = msg instanceof ByteBuf;
@@ -304,7 +304,7 @@ public boolean release(int decrement) {
@Override
public long transferTo(WritableByteChannel target, long position) throws IOException {
- Preconditions.checkArgument(position == transferred(), "Invalid position.");
+ JavaUtils.checkArgument(position == transferred(), "Invalid position.");
if (transferred == count) {
return 0;
diff --git a/common/network-common/src/main/java/org/apache/spark/network/crypto/GcmTransportCipher.java b/common/network-common/src/main/java/org/apache/spark/network/crypto/GcmTransportCipher.java
index c3540838bef09..e1cf22a612ea4 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/crypto/GcmTransportCipher.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/crypto/GcmTransportCipher.java
@@ -18,15 +18,16 @@
package org.apache.spark.network.crypto;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import com.google.common.primitives.Longs;
import com.google.crypto.tink.subtle.*;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import io.netty.channel.*;
import io.netty.util.ReferenceCounted;
+
import org.apache.spark.network.util.AbstractFileRegion;
import org.apache.spark.network.util.ByteBufferWriteableChannel;
+import org.apache.spark.network.util.JavaUtils;
import javax.crypto.spec.SecretKeySpec;
import java.io.IOException;
@@ -118,7 +119,7 @@ static class GcmEncryptedMessage extends AbstractFileRegion {
Object plaintextMessage,
ByteBuffer plaintextBuffer,
ByteBuffer ciphertextBuffer) throws GeneralSecurityException {
- Preconditions.checkArgument(
+ JavaUtils.checkArgument(
plaintextMessage instanceof ByteBuf || plaintextMessage instanceof FileRegion,
"Unrecognized message type: %s", plaintextMessage.getClass().getName());
this.plaintextMessage = plaintextMessage;
@@ -221,10 +222,12 @@ public long transferTo(WritableByteChannel target, long position) throws IOExcep
int readLimit =
(int) Math.min(readableBytes, plaintextBuffer.remaining());
if (plaintextMessage instanceof ByteBuf byteBuf) {
- Preconditions.checkState(0 == plaintextBuffer.position());
+ JavaUtils.checkState(0 == plaintextBuffer.position(),
+ "plaintextBuffer.position is not 0");
plaintextBuffer.limit(readLimit);
byteBuf.readBytes(plaintextBuffer);
- Preconditions.checkState(readLimit == plaintextBuffer.position());
+ JavaUtils.checkState(readLimit == plaintextBuffer.position(),
+ "plaintextBuffer.position should be equal to readLimit.");
} else if (plaintextMessage instanceof FileRegion fileRegion) {
ByteBufferWriteableChannel plaintextChannel =
new ByteBufferWriteableChannel(plaintextBuffer);
@@ -347,7 +350,7 @@ private boolean initalizeDecrypter(ByteBuf ciphertextNettyBuf)
@Override
public void channelRead(ChannelHandlerContext ctx, Object ciphertextMessage)
throws GeneralSecurityException {
- Preconditions.checkArgument(ciphertextMessage instanceof ByteBuf,
+ JavaUtils.checkArgument(ciphertextMessage instanceof ByteBuf,
"Unrecognized message type: %s",
ciphertextMessage.getClass().getName());
ByteBuf ciphertextNettyBuf = (ByteBuf) ciphertextMessage;
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/AbstractMessage.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/AbstractMessage.java
index 2924218c2f08b..1170fd3f1ab33 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/AbstractMessage.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/AbstractMessage.java
@@ -17,7 +17,7 @@
package org.apache.spark.network.protocol;
-import com.google.common.base.Objects;
+import java.util.Objects;
import org.apache.spark.network.buffer.ManagedBuffer;
@@ -48,7 +48,7 @@ public boolean isBodyInFrame() {
}
protected boolean equals(AbstractMessage other) {
- return isBodyInFrame == other.isBodyInFrame && Objects.equal(body, other.body);
+ return isBodyInFrame == other.isBodyInFrame && Objects.equals(body, other.body);
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchFailure.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchFailure.java
index cbad4c61b9b4a..736d8e6f5eea2 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchFailure.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchFailure.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* Response to {@link ChunkFetchRequest} when there is an error fetching the chunk.
@@ -70,9 +68,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamChunkId", streamChunkId)
- .append("errorString", errorString)
- .toString();
+ return "ChunkFetchFailure[streamChunkId=" + streamChunkId + ",errorString=" + errorString + "]";
}
}
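Reviewer note: the hand-rolled `toString` here (and in the protocol classes below) is meant to reproduce what commons-lang3's `ToStringStyle.SHORT_PREFIX_STYLE` printed, i.e. `ClassName[field=value,field2=value2]`. A small illustrative sketch with a hypothetical message type, not a class from this patch:

```java
// Illustrative only: a hypothetical message type showing the plain-concatenation
// toString shape that replaces ToStringBuilder(SHORT_PREFIX_STYLE) throughout this patch.
record ExampleFailure(long streamId, String errorString) {
  @Override
  public String toString() {
    // SHORT_PREFIX_STYLE output looks like: ExampleFailure[streamId=7,errorString=boom]
    return "ExampleFailure[streamId=" + streamId + ",errorString=" + errorString + "]";
  }
}
```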
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchRequest.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchRequest.java
index 2865388b3297c..cc042fdf76b77 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchRequest.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchRequest.java
@@ -18,8 +18,6 @@
package org.apache.spark.network.protocol;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* Request to fetch a sequence of a single chunk of a stream. This will correspond to a single
@@ -64,8 +62,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamChunkId", streamChunkId)
- .toString();
+ return "ChunkFetchRequest[streamChunkId=" + streamChunkId + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchSuccess.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchSuccess.java
index aa89b2062f626..948190e7a2d53 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchSuccess.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/ChunkFetchSuccess.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
@@ -83,9 +81,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamChunkId", streamChunkId)
- .append("buffer", body())
- .toString();
+ return "ChunkFetchSuccess[streamChunkId=" + streamChunkId + ",body=" + body() + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/EncryptedMessageWithHeader.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/EncryptedMessageWithHeader.java
index 321ac13881c2a..84917eca17190 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/EncryptedMessageWithHeader.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/EncryptedMessageWithHeader.java
@@ -21,7 +21,6 @@
import java.io.InputStream;
import javax.annotation.Nullable;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.ByteBufAllocator;
import io.netty.channel.ChannelHandlerContext;
@@ -29,6 +28,7 @@
import io.netty.handler.stream.ChunkedInput;
import org.apache.spark.network.buffer.ManagedBuffer;
+import org.apache.spark.network.util.JavaUtils;
/**
* A wrapper message that holds two separate pieces (a header and a body).
@@ -60,7 +60,7 @@ public class EncryptedMessageWithHeader implements ChunkedInput<ByteBuf> {
public EncryptedMessageWithHeader(
@Nullable ManagedBuffer managedBuffer, ByteBuf header, Object body, long bodyLength) {
- Preconditions.checkArgument(body instanceof InputStream || body instanceof ChunkedStream,
+ JavaUtils.checkArgument(body instanceof InputStream || body instanceof ChunkedStream,
"Body must be an InputStream or a ChunkedStream.");
this.managedBuffer = managedBuffer;
this.header = header;
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaRequest.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaRequest.java
index 3723730ebc06c..0b1476664f651 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaRequest.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaRequest.java
@@ -17,10 +17,9 @@
package org.apache.spark.network.protocol;
-import com.google.common.base.Objects;
+import java.util.Objects;
+
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* Request to find the meta information for the specified merged block. The meta information
@@ -79,7 +78,7 @@ public static MergedBlockMetaRequest decode(ByteBuf buf) {
@Override
public int hashCode() {
- return Objects.hashCode(requestId, appId, shuffleId, shuffleMergeId, reduceId);
+ return Objects.hash(requestId, appId, shuffleId, shuffleMergeId, reduceId);
}
@Override
@@ -87,19 +86,14 @@ public boolean equals(Object other) {
if (other instanceof MergedBlockMetaRequest o) {
return requestId == o.requestId && shuffleId == o.shuffleId &&
shuffleMergeId == o.shuffleMergeId && reduceId == o.reduceId &&
- Objects.equal(appId, o.appId);
+ Objects.equals(appId, o.appId);
}
return false;
}
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("requestId", requestId)
- .append("appId", appId)
- .append("shuffleId", shuffleId)
- .append("shuffleMergeId", shuffleMergeId)
- .append("reduceId", reduceId)
- .toString();
+ return "MergedBlockMetaRequest[requestId=" + requestId + ",appId=" + appId + ",shuffleId=" +
+ shuffleId + ",shuffleMergeId=" + shuffleMergeId + ",reduceId=" + reduceId + "]";
}
}
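Reviewer note: the `hashCode`/`equals` changes above are a mechanical swap from Guava's `com.google.common.base.Objects` to `java.util.Objects`. A minimal sketch of the equivalent calls, using hypothetical fields:

```java
import java.util.Objects;

// Sketch of the Guava -> JDK swap used above:
//   com.google.common.base.Objects.hashCode(a, b, ...) -> java.util.Objects.hash(a, b, ...)
//   com.google.common.base.Objects.equal(x, y)         -> java.util.Objects.equals(x, y)
final class HashEqualsSketch {
  private final long requestId;
  private final String appId;

  HashEqualsSketch(long requestId, String appId) {
    this.requestId = requestId;
    this.appId = appId;
  }

  @Override
  public int hashCode() {
    return Objects.hash(requestId, appId); // null-safe, varargs
  }

  @Override
  public boolean equals(Object other) {
    return other instanceof HashEqualsSketch o
        && requestId == o.requestId
        && Objects.equals(appId, o.appId); // null-safe field comparison
  }
}
```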
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaSuccess.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaSuccess.java
index d2edaf4532e11..255174e34600c 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaSuccess.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/MergedBlockMetaSuccess.java
@@ -17,10 +17,9 @@
package org.apache.spark.network.protocol;
-import com.google.common.base.Objects;
+import java.util.Objects;
+
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
@@ -51,13 +50,12 @@ public Type type() {
@Override
public int hashCode() {
- return Objects.hashCode(requestId, numChunks);
+ return Objects.hash(requestId, numChunks);
}
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("requestId", requestId).append("numChunks", numChunks).toString();
+ return "MergedBlockMetaSuccess[requestId=" + requestId + ",numChunks=" + numChunks + "]";
}
@Override
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageEncoder.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageEncoder.java
index ab20fb908eb42..3f23c17939e6c 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageEncoder.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageEncoder.java
@@ -66,8 +66,8 @@ public void encode(ChannelHandlerContext ctx, Message in, List<Object> out) thro
// Re-encode this message as a failure response.
String error = e.getMessage() != null ? e.getMessage() : "null";
logger.error("Error processing {} for client {}", e,
- MDC.of(LogKeys.MESSAGE$.MODULE$, in),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, ctx.channel().remoteAddress()));
+ MDC.of(LogKeys.MESSAGE, in),
+ MDC.of(LogKeys.HOST_PORT, ctx.channel().remoteAddress()));
encode(ctx, resp.createFailureResponse(error), out);
} else {
throw e;
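Reviewer note: the repeated `LogKeys.X$.MODULE$ -> LogKeys.X` change reflects how Java reaches a Scala `object` (via its `$.MODULE$` singleton field); after this patch the keys are presumably exposed as plain Java constants. A hypothetical sketch of why the call sites get shorter; `LogKeySketch` and `MdcEntry` are stand-ins, not the real Spark `LogKeys`/`MDC` API:

```java
// Hypothetical illustration: a Scala `object LogKeys { ... }` member is referenced from
// Java as LogKeys.HOST_PORT$.MODULE$, whereas a plain Java constant is just LogKeys.HOST_PORT.
enum LogKeySketch { HOST_PORT, MESSAGE }

final class MdcSketch {
  record MdcEntry(LogKeySketch key, Object value) {
    static MdcEntry of(LogKeySketch key, Object value) {
      return new MdcEntry(key, value);
    }
  }

  public static void main(String[] args) {
    // After the change, log call sites read like:
    MdcEntry entry = MdcEntry.of(LogKeySketch.HOST_PORT, "10.0.0.1:7077");
    System.out.println(entry);
  }
}
```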
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageWithHeader.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageWithHeader.java
index e8eb83e7577bf..993ce2381caa5 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageWithHeader.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/MessageWithHeader.java
@@ -22,13 +22,13 @@
import java.nio.channels.WritableByteChannel;
import javax.annotation.Nullable;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
import io.netty.channel.FileRegion;
import io.netty.util.ReferenceCountUtil;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.util.AbstractFileRegion;
+import org.apache.spark.network.util.JavaUtils;
/**
* A wrapper message that holds two separate pieces (a header and a body).
@@ -72,7 +72,7 @@ public class MessageWithHeader extends AbstractFileRegion {
ByteBuf header,
Object body,
long bodyLength) {
- Preconditions.checkArgument(body instanceof ByteBuf || body instanceof FileRegion,
+ JavaUtils.checkArgument(body instanceof ByteBuf || body instanceof FileRegion,
"Body must be a ByteBuf or a FileRegion.");
this.managedBuffer = managedBuffer;
this.header = header;
@@ -105,7 +105,7 @@ public long transferred() {
*/
@Override
public long transferTo(final WritableByteChannel target, final long position) throws IOException {
- Preconditions.checkArgument(position == totalBytesTransferred, "Invalid position.");
+ JavaUtils.checkArgument(position == totalBytesTransferred, "Invalid position.");
// Bytes written for header in this call.
long writtenHeader = 0;
if (header.readableBytes() > 0) {
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/OneWayMessage.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/OneWayMessage.java
index 91c818f3612a9..de1f91bc8d318 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/OneWayMessage.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/OneWayMessage.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
@@ -74,8 +72,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("body", body())
- .toString();
+ return "OneWayMessage[body=" + body() + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcFailure.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcFailure.java
index 02a45d68c650e..f48264a494f0e 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcFailure.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcFailure.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/** Response to {@link RpcRequest} for a failed RPC. */
public final class RpcFailure extends AbstractMessage implements ResponseMessage {
@@ -68,9 +66,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("requestId", requestId)
- .append("errorString", errorString)
- .toString();
+ return "RpcFailure[requestId=" + requestId + ",errorString=" + errorString + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcRequest.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcRequest.java
index a7dbe1283b314..2619b176e331e 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcRequest.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcRequest.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
@@ -80,9 +78,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("requestId", requestId)
- .append("body", body())
- .toString();
+ return "RpcRequest[requestId=" + requestId + ",body=" + body() + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcResponse.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcResponse.java
index 85709e36f83ee..a9805bcf686b4 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcResponse.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/RpcResponse.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
@@ -80,9 +78,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("requestId", requestId)
- .append("body", body())
- .toString();
+ return "RpcResponse[requestId=" + requestId + ",body=" + body() + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/SslMessageEncoder.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/SslMessageEncoder.java
index abe6ccca7bfd6..083e45b3d6bdb 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/SslMessageEncoder.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/SslMessageEncoder.java
@@ -71,8 +71,8 @@ public void encode(ChannelHandlerContext ctx, Message in, List<Object> out) thro
// Re-encode this message as a failure response.
String error = e.getMessage() != null ? e.getMessage() : "null";
logger.error("Error processing {} for client {}", e,
- MDC.of(LogKeys.MESSAGE$.MODULE$, in),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, ctx.channel().remoteAddress()));
+ MDC.of(LogKeys.MESSAGE, in),
+ MDC.of(LogKeys.HOST_PORT, ctx.channel().remoteAddress()));
encode(ctx, resp.createFailureResponse(error), out);
} else {
throw e;
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamChunkId.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamChunkId.java
index c3b715009dffe..61aae3e36eceb 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamChunkId.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamChunkId.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* Encapsulates a request for a particular chunk of a stream.
@@ -61,9 +59,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamId", streamId)
- .append("chunkIndex", chunkIndex)
- .toString();
+ return "StreamChunkId[streamId=" + streamId + ",chunkIndex=" + chunkIndex + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamFailure.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamFailure.java
index 9a7bf2f65af3a..50cc25a4919a5 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamFailure.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamFailure.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* Message indicating an error when transferring a stream.
@@ -70,10 +68,7 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamId", streamId)
- .append("error", error)
- .toString();
+ return "StreamFailure[streamId=" + streamId + ",error=" + error + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamRequest.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamRequest.java
index 5906b4d380d6e..45ca2578b01a4 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamRequest.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamRequest.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
/**
* Request to stream data from the remote end.
@@ -69,9 +67,7 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamId", streamId)
- .toString();
+ return "StreamRequest[streamId=" + streamId + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamResponse.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamResponse.java
index 0c0aa5c9a635b..d7c304e5c5b34 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamResponse.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/StreamResponse.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
@@ -83,11 +81,8 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamId", streamId)
- .append("byteCount", byteCount)
- .append("body", body())
- .toString();
+ return "StreamResponse[streamId=" + streamId + ",byteCount=" + byteCount +
+ ",body=" + body() + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/protocol/UploadStream.java b/common/network-common/src/main/java/org/apache/spark/network/protocol/UploadStream.java
index 4722f39dfa9db..09baaf60c3f92 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/protocol/UploadStream.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/protocol/UploadStream.java
@@ -21,8 +21,6 @@
import java.nio.ByteBuffer;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
@@ -99,9 +97,6 @@ public boolean equals(Object other) {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("requestId", requestId)
- .append("body", body())
- .toString();
+ return "UploadStream[requestId=" + requestId + ",body=" + body() + "]";
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/sasl/SaslEncryption.java b/common/network-common/src/main/java/org/apache/spark/network/sasl/SaslEncryption.java
index e1275689ae6a0..1cdb951d2d04e 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/sasl/SaslEncryption.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/sasl/SaslEncryption.java
@@ -23,7 +23,6 @@
import java.util.List;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import io.netty.channel.Channel;
@@ -35,6 +34,7 @@
import org.apache.spark.network.util.AbstractFileRegion;
import org.apache.spark.network.util.ByteArrayWritableChannel;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.NettyUtils;
/**
@@ -152,7 +152,7 @@ static class EncryptedMessage extends AbstractFileRegion {
private long transferred;
EncryptedMessage(SaslEncryptionBackend backend, Object msg, int maxOutboundBlockSize) {
- Preconditions.checkArgument(msg instanceof ByteBuf || msg instanceof FileRegion,
+ JavaUtils.checkArgument(msg instanceof ByteBuf || msg instanceof FileRegion,
"Unrecognized message type: %s", msg.getClass().getName());
this.backend = backend;
this.isByteBuf = msg instanceof ByteBuf;
@@ -241,7 +241,7 @@ public boolean release(int decrement) {
public long transferTo(final WritableByteChannel target, final long position)
throws IOException {
- Preconditions.checkArgument(position == transferred(), "Invalid position.");
+ JavaUtils.checkArgument(position == transferred(), "Invalid position.");
long reportedWritten = 0L;
long actuallyWritten = 0L;
diff --git a/common/network-common/src/main/java/org/apache/spark/network/sasl/SparkSaslServer.java b/common/network-common/src/main/java/org/apache/spark/network/sasl/SparkSaslServer.java
index f32fd5145c7c5..24e01c924ef3a 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/sasl/SparkSaslServer.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/sasl/SparkSaslServer.java
@@ -29,8 +29,8 @@
import javax.security.sasl.SaslServer;
import java.nio.charset.StandardCharsets;
import java.util.Map;
+import java.util.Objects;
-import com.google.common.base.Preconditions;
import com.google.common.collect.ImmutableMap;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
@@ -182,13 +182,13 @@ public void handle(Callback[] callbacks) throws UnsupportedCallbackException {
/* Encode a byte[] identifier as a Base64-encoded string. */
public static String encodeIdentifier(String identifier) {
- Preconditions.checkNotNull(identifier, "User cannot be null if SASL is enabled");
+ Objects.requireNonNull(identifier, "User cannot be null if SASL is enabled");
return getBase64EncodedString(identifier);
}
/** Encode a password as a base64-encoded char[] array. */
public static char[] encodePassword(String password) {
- Preconditions.checkNotNull(password, "Password cannot be null if SASL is enabled");
+ Objects.requireNonNull(password, "Password cannot be null if SASL is enabled");
return getBase64EncodedString(password).toCharArray();
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/server/BlockPushNonFatalFailure.java b/common/network-common/src/main/java/org/apache/spark/network/server/BlockPushNonFatalFailure.java
index f60a74670d149..a0e9305265385 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/server/BlockPushNonFatalFailure.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/server/BlockPushNonFatalFailure.java
@@ -18,8 +18,9 @@
package org.apache.spark.network.server;
import java.nio.ByteBuffer;
+import java.util.Objects;
-import com.google.common.base.Preconditions;
+import org.apache.spark.network.util.JavaUtils;
/**
* A special RuntimeException thrown when shuffle service experiences a non-fatal failure
@@ -101,14 +102,12 @@ public synchronized Throwable fillInStackTrace() {
public ByteBuffer getResponse() {
// Ensure we do not invoke this method if response is not set
- Preconditions.checkNotNull(response);
- return response;
+ return Objects.requireNonNull(response);
}
public ReturnCode getReturnCode() {
// Ensure we do not invoke this method if returnCode is not set
- Preconditions.checkNotNull(returnCode);
- return returnCode;
+ return Objects.requireNonNull(returnCode);
}
public enum ReturnCode {
@@ -171,7 +170,7 @@ public static boolean shouldNotRetryErrorCode(ReturnCode returnCode) {
}
public static String getErrorMsg(String blockId, ReturnCode errorCode) {
- Preconditions.checkArgument(errorCode != ReturnCode.SUCCESS);
+ JavaUtils.checkArgument(errorCode != ReturnCode.SUCCESS, "errorCode should not be SUCCESS.");
return "Block " + blockId + errorCode.errorMsgSuffix;
}
}
diff --git a/common/network-common/src/main/java/org/apache/spark/network/server/ChunkFetchRequestHandler.java b/common/network-common/src/main/java/org/apache/spark/network/server/ChunkFetchRequestHandler.java
index cc0bed7ed5b6d..c7d4d671dec7d 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/server/ChunkFetchRequestHandler.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/server/ChunkFetchRequestHandler.java
@@ -19,7 +19,6 @@
import java.net.SocketAddress;
-import com.google.common.base.Throwables;
import io.netty.channel.Channel;
import io.netty.channel.ChannelFuture;
import io.netty.channel.ChannelFutureListener;
@@ -36,6 +35,7 @@
import org.apache.spark.network.protocol.ChunkFetchRequest;
import org.apache.spark.network.protocol.ChunkFetchSuccess;
import org.apache.spark.network.protocol.Encodable;
+import org.apache.spark.network.util.JavaUtils;
import static org.apache.spark.network.util.NettyUtils.*;
@@ -74,7 +74,7 @@ public ChunkFetchRequestHandler(
@Override
public void exceptionCaught(ChannelHandlerContext ctx, Throwable cause) throws Exception {
logger.warn("Exception in connection from {}", cause,
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(ctx.channel())));
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(ctx.channel())));
ctx.close();
}
@@ -96,8 +96,8 @@ public void processFetchRequest(
long chunksBeingTransferred = streamManager.chunksBeingTransferred();
if (chunksBeingTransferred >= maxChunksBeingTransferred) {
logger.warn("The number of chunks being transferred {} is above {}, close the connection.",
- MDC.of(LogKeys.NUM_CHUNKS$.MODULE$, chunksBeingTransferred),
- MDC.of(LogKeys.MAX_NUM_CHUNKS$.MODULE$, maxChunksBeingTransferred));
+ MDC.of(LogKeys.NUM_CHUNKS, chunksBeingTransferred),
+ MDC.of(LogKeys.MAX_NUM_CHUNKS, maxChunksBeingTransferred));
channel.close();
return;
}
@@ -111,10 +111,10 @@ public void processFetchRequest(
}
} catch (Exception e) {
logger.error("Error opening block {} for request from {}", e,
- MDC.of(LogKeys.STREAM_CHUNK_ID$.MODULE$, msg.streamChunkId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
+ MDC.of(LogKeys.STREAM_CHUNK_ID, msg.streamChunkId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
respond(channel, new ChunkFetchFailure(msg.streamChunkId,
- Throwables.getStackTraceAsString(e)));
+ JavaUtils.stackTraceToString(e)));
return;
}
@@ -153,8 +153,8 @@ private ChannelFuture respond(
} else {
logger.error("Error sending result {} to {}; closing connection",
future.cause(),
- MDC.of(LogKeys.RESULT$.MODULE$, result),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, remoteAddress));
+ MDC.of(LogKeys.RESULT, result),
+ MDC.of(LogKeys.HOST_PORT, remoteAddress));
channel.close();
}
});
diff --git a/common/network-common/src/main/java/org/apache/spark/network/server/OneForOneStreamManager.java b/common/network-common/src/main/java/org/apache/spark/network/server/OneForOneStreamManager.java
index f322293782dee..cb53d565e7e87 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/server/OneForOneStreamManager.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/server/OneForOneStreamManager.java
@@ -19,20 +19,20 @@
import java.util.Iterator;
import java.util.Map;
+import java.util.Objects;
import java.util.Random;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.atomic.AtomicLong;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import io.netty.channel.Channel;
-import org.apache.commons.lang3.tuple.ImmutablePair;
-import org.apache.commons.lang3.tuple.Pair;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.client.TransportClient;
+import org.apache.spark.network.util.JavaUtils;
+import org.apache.spark.util.Pair;
/**
* StreamManager which allows registration of an Iterator<ManagedBuffer>, which are
@@ -72,7 +72,7 @@ private static class StreamState {
Channel channel,
boolean isBufferMaterializedOnNext) {
this.appId = appId;
- this.buffers = Preconditions.checkNotNull(buffers);
+ this.buffers = Objects.requireNonNull(buffers);
this.associatedChannel = channel;
this.isBufferMaterializedOnNext = isBufferMaterializedOnNext;
}
@@ -127,7 +127,7 @@ public static Pair<Long, Integer> parseStreamChunkId(String streamChunkId) {
"Stream id and chunk index should be specified.";
long streamId = Long.valueOf(array[0]);
int chunkIndex = Integer.valueOf(array[1]);
- return ImmutablePair.of(streamId, chunkIndex);
+ return Pair.of(streamId, chunkIndex);
}
@Override
@@ -167,7 +167,7 @@ public void connectionTerminated(Channel channel) {
public void checkAuthorization(TransportClient client, long streamId) {
if (client.getClientId() != null) {
StreamState state = streams.get(streamId);
- Preconditions.checkArgument(state != null, "Unknown stream ID.");
+ JavaUtils.checkArgument(state != null, "Unknown stream ID.");
if (!client.getClientId().equals(state.appId)) {
throw new SecurityException(String.format(
"Client %s not authorized to read stream %d (app %s).",
diff --git a/common/network-common/src/main/java/org/apache/spark/network/server/TransportChannelHandler.java b/common/network-common/src/main/java/org/apache/spark/network/server/TransportChannelHandler.java
index 283f0f0a431fd..d0df24873cbce 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/server/TransportChannelHandler.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/server/TransportChannelHandler.java
@@ -88,7 +88,7 @@ public TransportClient getClient() {
@Override
public void exceptionCaught(ChannelHandlerContext ctx, Throwable cause) throws Exception {
logger.warn("Exception in connection from {}", cause,
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(ctx.channel())));
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(ctx.channel())));
requestHandler.exceptionCaught(cause);
responseHandler.exceptionCaught(cause);
ctx.close();
@@ -168,9 +168,9 @@ public void userEventTriggered(ChannelHandlerContext ctx, Object evt) throws Exc
logger.error("Connection to {} has been quiet for {} ms while there are outstanding " +
"requests. Assuming connection is dead; please adjust" +
" spark.{}.io.connectionTimeout if this is wrong.",
- MDC.of(LogKeys.HOST_PORT$.MODULE$, address),
- MDC.of(LogKeys.TIMEOUT$.MODULE$, requestTimeoutNs / 1000 / 1000),
- MDC.of(LogKeys.MODULE_NAME$.MODULE$, transportContext.getConf().getModuleName()));
+ MDC.of(LogKeys.HOST_PORT, address),
+ MDC.of(LogKeys.TIMEOUT, requestTimeoutNs / 1000 / 1000),
+ MDC.of(LogKeys.MODULE_NAME, transportContext.getConf().getModuleName()));
client.timeOut();
ctx.close();
} else if (closeIdleConnections) {
diff --git a/common/network-common/src/main/java/org/apache/spark/network/server/TransportRequestHandler.java b/common/network-common/src/main/java/org/apache/spark/network/server/TransportRequestHandler.java
index 2727051894b7a..464d4d9eb378f 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/server/TransportRequestHandler.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/server/TransportRequestHandler.java
@@ -21,7 +21,6 @@
import java.net.SocketAddress;
import java.nio.ByteBuffer;
-import com.google.common.base.Throwables;
import io.netty.channel.Channel;
import io.netty.channel.ChannelFuture;
@@ -33,6 +32,7 @@
import org.apache.spark.network.buffer.NioManagedBuffer;
import org.apache.spark.network.client.*;
import org.apache.spark.network.protocol.*;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.TransportFrameDecoder;
import static org.apache.spark.network.util.NettyUtils.getRemoteAddress;
@@ -132,8 +132,8 @@ private void processStreamRequest(final StreamRequest req) {
long chunksBeingTransferred = streamManager.chunksBeingTransferred();
if (chunksBeingTransferred >= maxChunksBeingTransferred) {
logger.warn("The number of chunks being transferred {} is above {}, close the connection.",
- MDC.of(LogKeys.NUM_CHUNKS$.MODULE$, chunksBeingTransferred),
- MDC.of(LogKeys.MAX_NUM_CHUNKS$.MODULE$, maxChunksBeingTransferred));
+ MDC.of(LogKeys.NUM_CHUNKS, chunksBeingTransferred),
+ MDC.of(LogKeys.MAX_NUM_CHUNKS, maxChunksBeingTransferred));
channel.close();
return;
}
@@ -143,9 +143,9 @@ private void processStreamRequest(final StreamRequest req) {
buf = streamManager.openStream(req.streamId);
} catch (Exception e) {
logger.error("Error opening stream {} for request from {}", e,
- MDC.of(LogKeys.STREAM_ID$.MODULE$, req.streamId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
- respond(new StreamFailure(req.streamId, Throwables.getStackTraceAsString(e)));
+ MDC.of(LogKeys.STREAM_ID, req.streamId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
+ respond(new StreamFailure(req.streamId, JavaUtils.stackTraceToString(e)));
return;
}
@@ -172,14 +172,14 @@ public void onSuccess(ByteBuffer response) {
@Override
public void onFailure(Throwable e) {
- respond(new RpcFailure(req.requestId, Throwables.getStackTraceAsString(e)));
+ respond(new RpcFailure(req.requestId, JavaUtils.stackTraceToString(e)));
}
});
} catch (Exception e) {
logger.error("Error while invoking RpcHandler#receive() on RPC id {} from {}", e,
- MDC.of(LogKeys.REQUEST_ID$.MODULE$, req.requestId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
- respond(new RpcFailure(req.requestId, Throwables.getStackTraceAsString(e)));
+ MDC.of(LogKeys.REQUEST_ID, req.requestId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
+ respond(new RpcFailure(req.requestId, JavaUtils.stackTraceToString(e)));
} finally {
req.body().release();
}
@@ -199,7 +199,7 @@ public void onSuccess(ByteBuffer response) {
@Override
public void onFailure(Throwable e) {
- respond(new RpcFailure(req.requestId, Throwables.getStackTraceAsString(e)));
+ respond(new RpcFailure(req.requestId, JavaUtils.stackTraceToString(e)));
}
};
TransportFrameDecoder frameDecoder = (TransportFrameDecoder)
@@ -264,9 +264,9 @@ public String getID() {
new NioManagedBuffer(blockPushNonFatalFailure.getResponse())));
} else {
logger.error("Error while invoking RpcHandler#receive() on RPC id {} from {}", e,
- MDC.of(LogKeys.REQUEST_ID$.MODULE$, req.requestId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
- respond(new RpcFailure(req.requestId, Throwables.getStackTraceAsString(e)));
+ MDC.of(LogKeys.REQUEST_ID, req.requestId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
+ respond(new RpcFailure(req.requestId, JavaUtils.stackTraceToString(e)));
}
// We choose to totally fail the channel, rather than trying to recover as we do in other
// cases. We don't know how many bytes of the stream the client has already sent for the
@@ -282,7 +282,7 @@ private void processOneWayMessage(OneWayMessage req) {
rpcHandler.receive(reverseClient, req.body().nioByteBuffer());
} catch (Exception e) {
logger.error("Error while invoking RpcHandler#receive() for one-way message from {}.", e,
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
} finally {
req.body().release();
}
@@ -302,16 +302,16 @@ public void onSuccess(int numChunks, ManagedBuffer buffer) {
@Override
public void onFailure(Throwable e) {
logger.trace("Failed to send meta for {}", req);
- respond(new RpcFailure(req.requestId, Throwables.getStackTraceAsString(e)));
+ respond(new RpcFailure(req.requestId, JavaUtils.stackTraceToString(e)));
}
});
} catch (Exception e) {
logger.error("Error while invoking receiveMergeBlockMetaReq() for appId {} shuffleId {} "
- + "reduceId {} from {}", e, MDC.of(LogKeys.APP_ID$.MODULE$, req.appId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, req.shuffleId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, req.reduceId),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, getRemoteAddress(channel)));
- respond(new RpcFailure(req.requestId, Throwables.getStackTraceAsString(e)));
+ + "reduceId {} from {}", e, MDC.of(LogKeys.APP_ID, req.appId),
+ MDC.of(LogKeys.SHUFFLE_ID, req.shuffleId),
+ MDC.of(LogKeys.REDUCE_ID, req.reduceId),
+ MDC.of(LogKeys.HOST_PORT, getRemoteAddress(channel)));
+ respond(new RpcFailure(req.requestId, JavaUtils.stackTraceToString(e)));
}
}
@@ -326,8 +326,8 @@ private ChannelFuture respond(Encodable result) {
logger.trace("Sent result {} to client {}", result, remoteAddress);
} else {
logger.error("Error sending result {} to {}; closing connection", future.cause(),
- MDC.of(LogKeys.RESULT$.MODULE$, result),
- MDC.of(LogKeys.HOST_PORT$.MODULE$, remoteAddress));
+ MDC.of(LogKeys.RESULT, result),
+ MDC.of(LogKeys.HOST_PORT, remoteAddress));
channel.close();
}
});
diff --git a/common/network-common/src/main/java/org/apache/spark/network/server/TransportServer.java b/common/network-common/src/main/java/org/apache/spark/network/server/TransportServer.java
index d1a19652f5649..be5d9e03c45c1 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/server/TransportServer.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/server/TransportServer.java
@@ -19,13 +19,13 @@
import java.io.Closeable;
import java.net.InetSocketAddress;
+import java.util.ArrayList;
import java.util.List;
+import java.util.Objects;
import java.util.concurrent.TimeUnit;
import com.codahale.metrics.Counter;
import com.codahale.metrics.MetricSet;
-import com.google.common.base.Preconditions;
-import com.google.common.collect.Lists;
import io.netty.bootstrap.ServerBootstrap;
import io.netty.buffer.PooledByteBufAllocator;
import io.netty.channel.ChannelFuture;
@@ -33,7 +33,6 @@
import io.netty.channel.ChannelOption;
import io.netty.channel.EventLoopGroup;
import io.netty.channel.socket.SocketChannel;
-import org.apache.commons.lang3.SystemUtils;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -77,7 +76,7 @@ public TransportServer(
this.pooledAllocator = NettyUtils.createPooledByteBufAllocator(
conf.preferDirectBufs(), true /* allowCache */, conf.serverThreads());
}
- this.bootstraps = Lists.newArrayList(Preconditions.checkNotNull(bootstraps));
+ this.bootstraps = new ArrayList<>(Objects.requireNonNull(bootstraps));
boolean shouldClose = true;
try {
@@ -105,11 +104,13 @@ private void init(String hostToBind, int portToBind) {
EventLoopGroup workerGroup = NettyUtils.createEventLoop(ioMode, conf.serverThreads(),
conf.getModuleName() + "-server");
+ String name = System.getProperty("os.name");
+ boolean isNotWindows = !name.regionMatches(true, 0, "Windows", 0, 7);
bootstrap = new ServerBootstrap()
.group(bossGroup, workerGroup)
.channel(NettyUtils.getServerChannelClass(ioMode))
.option(ChannelOption.ALLOCATOR, pooledAllocator)
- .option(ChannelOption.SO_REUSEADDR, !SystemUtils.IS_OS_WINDOWS)
+ .option(ChannelOption.SO_REUSEADDR, isNotWindows)
.childOption(ChannelOption.ALLOCATOR, pooledAllocator);
this.metrics = new NettyMemoryMetrics(
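Reviewer note: the `SystemUtils.IS_OS_WINDOWS` replacement above amounts to a case-insensitive prefix check on the `os.name` system property. A standalone sketch of the check, assuming that semantics is all the server bootstrap needs:

```java
// Sketch of the commons-lang3 SystemUtils.IS_OS_WINDOWS replacement used above:
// a case-insensitive "does os.name start with Windows?" check.
final class OsCheckSketch {
  static boolean isWindows() {
    String name = System.getProperty("os.name", "");
    return name.regionMatches(true, 0, "Windows", 0, 7);
  }

  public static void main(String[] args) {
    // SO_REUSEADDR is enabled in the server bootstrap only on non-Windows platforms.
    System.out.println("SO_REUSEADDR enabled: " + !isWindows());
  }
}
```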
diff --git a/common/network-common/src/main/java/org/apache/spark/network/ssl/SSLFactory.java b/common/network-common/src/main/java/org/apache/spark/network/ssl/SSLFactory.java
index a2e42e3eb39f6..f4b245ca7b128 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/ssl/SSLFactory.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/ssl/SSLFactory.java
@@ -20,6 +20,7 @@
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
+import java.nio.file.Files;
import java.security.GeneralSecurityException;
import java.security.KeyStore;
import java.security.KeyStoreException;
@@ -41,8 +42,6 @@
import javax.net.ssl.TrustManagerFactory;
import javax.net.ssl.X509TrustManager;
-import com.google.common.io.Files;
-
import io.netty.buffer.ByteBufAllocator;
import io.netty.handler.ssl.OpenSsl;
import io.netty.handler.ssl.SslContext;
@@ -378,7 +377,7 @@ private static TrustManager[] trustStoreManagers(
private static TrustManager[] defaultTrustManagers(File trustStore, String trustStorePassword)
throws IOException, KeyStoreException, CertificateException, NoSuchAlgorithmException {
- try (InputStream input = Files.asByteSource(trustStore).openStream()) {
+ try (InputStream input = Files.newInputStream(trustStore.toPath())) {
KeyStore ks = KeyStore.getInstance(KeyStore.getDefaultType());
char[] passwordCharacters = trustStorePassword != null?
trustStorePassword.toCharArray() : null;
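Reviewer note: the Guava `Files.asByteSource(...).openStream()` call is replaced by `java.nio.file.Files.newInputStream` above. A small self-contained sketch of loading a keystore that way; the class name and error handling here are illustrative, not taken from SSLFactory:

```java
import java.io.File;
import java.io.InputStream;
import java.nio.file.Files;
import java.security.KeyStore;

// Sketch of the NIO replacement used above: open the trust store with
// Files.newInputStream and load it into a KeyStore, closing the stream afterwards.
final class TrustStoreSketch {
  static KeyStore load(File trustStore, String password) throws Exception {
    try (InputStream input = Files.newInputStream(trustStore.toPath())) {
      KeyStore ks = KeyStore.getInstance(KeyStore.getDefaultType());
      ks.load(input, password != null ? password.toCharArray() : null);
      return ks;
    }
  }
}
```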
diff --git a/common/network-common/src/main/java/org/apache/spark/network/util/LevelDBProvider.java b/common/network-common/src/main/java/org/apache/spark/network/util/LevelDBProvider.java
index 391931961a474..ec3e032102e4f 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/util/LevelDBProvider.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/util/LevelDBProvider.java
@@ -50,7 +50,7 @@ public static DB initLevelDB(File dbFile, StoreVersion version, ObjectMapper map
tmpDb = JniDBFactory.factory.open(dbFile, options);
} catch (NativeDB.DBException e) {
if (e.isNotFound() || e.getMessage().contains(" does not exist ")) {
- logger.info("Creating state database at {}", MDC.of(LogKeys.PATH$.MODULE$, dbFile));
+ logger.info("Creating state database at {}", MDC.of(LogKeys.PATH, dbFile));
options.createIfMissing(true);
try {
tmpDb = JniDBFactory.factory.open(dbFile, options);
@@ -61,16 +61,16 @@ public static DB initLevelDB(File dbFile, StoreVersion version, ObjectMapper map
// the leveldb file seems to be corrupt somehow. Lets just blow it away and create a new
// one, so we can keep processing new apps
logger.error("error opening leveldb file {}. Creating new file, will not be able to " +
- "recover state for existing applications", e, MDC.of(LogKeys.PATH$.MODULE$, dbFile));
+ "recover state for existing applications", e, MDC.of(LogKeys.PATH, dbFile));
if (dbFile.isDirectory()) {
for (File f : dbFile.listFiles()) {
if (!f.delete()) {
- logger.warn("error deleting {}", MDC.of(LogKeys.PATH$.MODULE$, f.getPath()));
+ logger.warn("error deleting {}", MDC.of(LogKeys.PATH, f.getPath()));
}
}
}
if (!dbFile.delete()) {
- logger.warn("error deleting {}", MDC.of(LogKeys.PATH$.MODULE$, dbFile.getPath()));
+ logger.warn("error deleting {}", MDC.of(LogKeys.PATH, dbFile.getPath()));
}
options.createIfMissing(true);
try {
diff --git a/common/network-common/src/main/java/org/apache/spark/network/util/LimitedInputStream.java b/common/network-common/src/main/java/org/apache/spark/network/util/LimitedInputStream.java
index e6cf02a590e29..79cf0eb7c6153 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/util/LimitedInputStream.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/util/LimitedInputStream.java
@@ -21,8 +21,7 @@
import java.io.FilterInputStream;
import java.io.IOException;
import java.io.InputStream;
-
-import com.google.common.base.Preconditions;
+import java.util.Objects;
/**
* Wraps a {@link InputStream}, limiting the number of bytes which can be read.
@@ -50,10 +49,9 @@ public LimitedInputStream(InputStream in, long limit) {
* @param closeWrappedStream whether to close {@code in} when {@link #close} is called
*/
public LimitedInputStream(InputStream in, long limit, boolean closeWrappedStream) {
- super(in);
+ super(Objects.requireNonNull(in));
this.closeWrappedStream = closeWrappedStream;
- Preconditions.checkNotNull(in);
- Preconditions.checkArgument(limit >= 0, "limit must be non-negative");
+ JavaUtils.checkArgument(limit >= 0, "limit must be non-negative");
left = limit;
}
@Override public int available() throws IOException {
diff --git a/common/network-common/src/main/java/org/apache/spark/network/util/RocksDBProvider.java b/common/network-common/src/main/java/org/apache/spark/network/util/RocksDBProvider.java
index 1753c124c9935..cea9207d3470a 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/util/RocksDBProvider.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/util/RocksDBProvider.java
@@ -67,7 +67,7 @@ public static RocksDB initRockDB(File dbFile, StoreVersion version, ObjectMapper
tmpDb = RocksDB.open(dbOptions, dbFile.toString());
} catch (RocksDBException e) {
if (e.getStatus().getCode() == Status.Code.NotFound) {
- logger.info("Creating state database at {}", MDC.of(LogKeys.PATH$.MODULE$, dbFile));
+ logger.info("Creating state database at {}", MDC.of(LogKeys.PATH, dbFile));
dbOptions.setCreateIfMissing(true);
try {
tmpDb = RocksDB.open(dbOptions, dbFile.toString());
@@ -78,16 +78,16 @@ public static RocksDB initRockDB(File dbFile, StoreVersion version, ObjectMapper
// the RocksDB file seems to be corrupt somehow. Let's just blow it away and create
// a new one, so we can keep processing new apps
logger.error("error opening rocksdb file {}. Creating new file, will not be able to " +
- "recover state for existing applications", e, MDC.of(LogKeys.PATH$.MODULE$, dbFile));
+ "recover state for existing applications", e, MDC.of(LogKeys.PATH, dbFile));
if (dbFile.isDirectory()) {
for (File f : Objects.requireNonNull(dbFile.listFiles())) {
if (!f.delete()) {
- logger.warn("error deleting {}", MDC.of(LogKeys.PATH$.MODULE$, f.getPath()));
+ logger.warn("error deleting {}", MDC.of(LogKeys.PATH, f.getPath()));
}
}
}
if (!dbFile.delete()) {
- logger.warn("error deleting {}", MDC.of(LogKeys.PATH$.MODULE$, dbFile.getPath()));
+ logger.warn("error deleting {}", MDC.of(LogKeys.PATH, dbFile.getPath()));
}
dbOptions.setCreateIfMissing(true);
try {
diff --git a/common/network-common/src/main/java/org/apache/spark/network/util/TransportConf.java b/common/network-common/src/main/java/org/apache/spark/network/util/TransportConf.java
index 822b8aa310a22..003e72edf29ee 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/util/TransportConf.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/util/TransportConf.java
@@ -21,8 +21,6 @@
import java.util.Locale;
import java.util.Properties;
import java.util.concurrent.TimeUnit;
-import com.google.common.base.Preconditions;
-import com.google.common.primitives.Ints;
import io.netty.util.NettyRuntime;
/**
@@ -171,7 +169,7 @@ public int ioRetryWaitTimeMs() {
* memory mapping has high overhead for blocks close to or below the page size of the OS.
*/
public int memoryMapBytes() {
- return Ints.checkedCast(JavaUtils.byteStringAsBytes(
+ return JavaUtils.checkedCast(JavaUtils.byteStringAsBytes(
conf.get("spark.storage.memoryMapThreshold", "2m")));
}
@@ -248,7 +246,7 @@ public boolean saslEncryption() {
* Maximum number of bytes to be encrypted at a time when SASL encryption is used.
*/
public int maxSaslEncryptedBlockSize() {
- return Ints.checkedCast(JavaUtils.byteStringAsBytes(
+ return JavaUtils.checkedCast(JavaUtils.byteStringAsBytes(
conf.get("spark.network.sasl.maxEncryptedBlockSize", "64k")));
}
@@ -263,7 +261,7 @@ public boolean saslServerAlwaysEncrypt() {
* When Secure (SSL/TLS) Shuffle is enabled, the Chunk size to use for shuffling files.
*/
public int sslShuffleChunkSize() {
- return Ints.checkedCast(JavaUtils.byteStringAsBytes(
+ return JavaUtils.checkedCast(JavaUtils.byteStringAsBytes(
conf.get("spark.network.ssl.maxEncryptedBlockSize", "64k")));
}
@@ -504,7 +502,7 @@ public int finalizeShuffleMergeHandlerThreads() {
if (!this.getModuleName().equalsIgnoreCase("shuffle")) {
return 0;
}
- Preconditions.checkArgument(separateFinalizeShuffleMerge(),
+ JavaUtils.checkArgument(separateFinalizeShuffleMerge(),
"Please set spark.shuffle.server.finalizeShuffleMergeThreadsPercent to a positive value");
int finalizeShuffleMergeThreadsPercent =
Integer.parseInt(conf.get("spark.shuffle.server.finalizeShuffleMergeThreadsPercent"));
@@ -567,7 +565,7 @@ public String mergedShuffleFileManagerImpl() {
* service unnecessarily.
*/
public int minChunkSizeInMergedShuffleFile() {
- return Ints.checkedCast(JavaUtils.byteStringAsBytes(
+ return JavaUtils.checkedCast(JavaUtils.byteStringAsBytes(
conf.get("spark.shuffle.push.server.minChunkSizeInMergedShuffleFile", "2m")));
}
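
Note (illustrative, not part of the patch): the `Ints.checkedCast` calls replaced above narrow a `long` byte-size to an `int` and fail fast on overflow; the `JavaUtils.checkedCast` that takes their place presumably keeps the same contract without the Guava dependency. A minimal JDK-only sketch of that contract, not Spark's actual implementation:

// Illustrative only: checked long-to-int narrowing with the same contract as
// Guava's Ints.checkedCast. Spark's JavaUtils.checkedCast may be implemented differently.
public final class CheckedCastExample {
  static int checkedCast(long value) {
    // Math.toIntExact throws ArithmeticException when the value does not fit in an int.
    return Math.toIntExact(value);
  }

  public static void main(String[] args) {
    System.out.println(checkedCast(2L * 1024 * 1024));   // 2097152
    try {
      checkedCast(Long.MAX_VALUE);                        // overflows: throws
    } catch (ArithmeticException e) {
      System.out.println("rejected: " + e.getMessage());
    }
  }
}
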
diff --git a/common/network-common/src/main/java/org/apache/spark/network/util/TransportFrameDecoder.java b/common/network-common/src/main/java/org/apache/spark/network/util/TransportFrameDecoder.java
index cef0e415aa40a..6b490068507aa 100644
--- a/common/network-common/src/main/java/org/apache/spark/network/util/TransportFrameDecoder.java
+++ b/common/network-common/src/main/java/org/apache/spark/network/util/TransportFrameDecoder.java
@@ -20,7 +20,6 @@
import java.util.LinkedList;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.CompositeByteBuf;
import io.netty.buffer.Unpooled;
@@ -145,9 +144,9 @@ private ByteBuf decodeNext() {
}
if (frameBuf == null) {
- Preconditions.checkArgument(frameSize < MAX_FRAME_SIZE,
+ JavaUtils.checkArgument(frameSize < MAX_FRAME_SIZE,
"Too large frame: %s", frameSize);
- Preconditions.checkArgument(frameSize > 0,
+ JavaUtils.checkArgument(frameSize > 0,
"Frame length should be positive: %s", frameSize);
frameRemainingBytes = (int) frameSize;
@@ -252,7 +251,7 @@ public void handlerRemoved(ChannelHandlerContext ctx) throws Exception {
}
public void setInterceptor(Interceptor interceptor) {
- Preconditions.checkState(this.interceptor == null, "Already have an interceptor.");
+ JavaUtils.checkState(this.interceptor == null, "Already have an interceptor.");
this.interceptor = interceptor;
}
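
Note (illustrative, not part of the patch): the Guava `Preconditions` helpers replaced above throw `IllegalArgumentException` (checkArgument) and `IllegalStateException` (checkState), with `%s`-style message formatting. A minimal sketch with the same observable behaviour; Spark's `JavaUtils` versions may format messages differently:

// Illustrative only: Preconditions-style helpers matching the call sites above.
public final class PreconditionsExample {
  // Rejects an invalid caller-supplied argument.
  static void checkArgument(boolean expression, String messageFormat, Object... args) {
    if (!expression) {
      throw new IllegalArgumentException(String.format(messageFormat, args));
    }
  }

  // Rejects a call made while the object is in the wrong state.
  static void checkState(boolean expression, String message) {
    if (!expression) {
      throw new IllegalStateException(message);
    }
  }

  public static void main(String[] args) {
    checkArgument(10 < 16, "Too large frame: %s", 10);           // passes silently
    try {
      checkState(false, "Already have an interceptor.");
    } catch (IllegalStateException e) {
      System.out.println(e.getMessage());
    }
  }
}
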
diff --git a/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchIntegrationSuite.java b/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchIntegrationSuite.java
index 576a106934fda..75ccd8d5789d4 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchIntegrationSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchIntegrationSuite.java
@@ -30,7 +30,6 @@
import java.util.concurrent.Semaphore;
import java.util.concurrent.TimeUnit;
-import com.google.common.collect.Sets;
import com.google.common.io.Closeables;
import org.junit.jupiter.api.AfterAll;
import org.junit.jupiter.api.BeforeAll;
@@ -188,7 +187,7 @@ public void onFailure(int chunkIndex, Throwable e) {
@Test
public void fetchBufferChunk() throws Exception {
FetchResult res = fetchChunks(Arrays.asList(BUFFER_CHUNK_INDEX));
- assertEquals(Sets.newHashSet(BUFFER_CHUNK_INDEX), res.successChunks);
+ assertEquals(Set.of(BUFFER_CHUNK_INDEX), res.successChunks);
assertTrue(res.failedChunks.isEmpty());
assertBufferListsEqual(Arrays.asList(bufferChunk), res.buffers);
res.releaseBuffers();
@@ -197,7 +196,7 @@ public void fetchBufferChunk() throws Exception {
@Test
public void fetchFileChunk() throws Exception {
FetchResult res = fetchChunks(Arrays.asList(FILE_CHUNK_INDEX));
- assertEquals(Sets.newHashSet(FILE_CHUNK_INDEX), res.successChunks);
+ assertEquals(Set.of(FILE_CHUNK_INDEX), res.successChunks);
assertTrue(res.failedChunks.isEmpty());
assertBufferListsEqual(Arrays.asList(fileChunk), res.buffers);
res.releaseBuffers();
@@ -207,14 +206,14 @@ public void fetchFileChunk() throws Exception {
public void fetchNonExistentChunk() throws Exception {
FetchResult res = fetchChunks(Arrays.asList(12345));
assertTrue(res.successChunks.isEmpty());
- assertEquals(Sets.newHashSet(12345), res.failedChunks);
+ assertEquals(Set.of(12345), res.failedChunks);
assertTrue(res.buffers.isEmpty());
}
@Test
public void fetchBothChunks() throws Exception {
FetchResult res = fetchChunks(Arrays.asList(BUFFER_CHUNK_INDEX, FILE_CHUNK_INDEX));
- assertEquals(Sets.newHashSet(BUFFER_CHUNK_INDEX, FILE_CHUNK_INDEX), res.successChunks);
+ assertEquals(Set.of(BUFFER_CHUNK_INDEX, FILE_CHUNK_INDEX), res.successChunks);
assertTrue(res.failedChunks.isEmpty());
assertBufferListsEqual(Arrays.asList(bufferChunk, fileChunk), res.buffers);
res.releaseBuffers();
@@ -223,8 +222,8 @@ public void fetchBothChunks() throws Exception {
@Test
public void fetchChunkAndNonExistent() throws Exception {
FetchResult res = fetchChunks(Arrays.asList(BUFFER_CHUNK_INDEX, 12345));
- assertEquals(Sets.newHashSet(BUFFER_CHUNK_INDEX), res.successChunks);
- assertEquals(Sets.newHashSet(12345), res.failedChunks);
+ assertEquals(Set.of(BUFFER_CHUNK_INDEX), res.successChunks);
+ assertEquals(Set.of(12345), res.failedChunks);
assertBufferListsEqual(Arrays.asList(bufferChunk), res.buffers);
res.releaseBuffers();
}
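
Note (illustrative, not part of the patch): unlike `Sets.newHashSet`, `Set.of` returns an unmodifiable set and rejects nulls and duplicate elements, which is sufficient here because the sets are only compared for equality. A small illustration:

import java.util.Set;

public class SetOfExample {
  public static void main(String[] args) {
    Set<Integer> chunks = Set.of(0, 1);                 // immutable literal set
    System.out.println(chunks.equals(Set.of(1, 0)));    // true: equality ignores order
    try {
      chunks.add(2);                                    // unmodifiable: throws
    } catch (UnsupportedOperationException e) {
      System.out.println("unmodifiable");
    }
  }
}
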
diff --git a/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchRequestHandlerSuite.java b/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchRequestHandlerSuite.java
index 74dffd87dcf30..e9a4c355ebe48 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchRequestHandlerSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/ChunkFetchRequestHandlerSuite.java
@@ -27,8 +27,6 @@
import static org.mockito.Mockito.*;
-import org.apache.commons.lang3.tuple.ImmutablePair;
-import org.apache.commons.lang3.tuple.Pair;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.client.TransportClient;
import org.apache.spark.network.protocol.*;
@@ -36,6 +34,7 @@
import org.apache.spark.network.server.NoOpRpcHandler;
import org.apache.spark.network.server.OneForOneStreamManager;
import org.apache.spark.network.server.RpcHandler;
+import org.apache.spark.util.Pair;
public class ChunkFetchRequestHandlerSuite {
@@ -54,7 +53,7 @@ public void handleChunkFetchRequest() throws Exception {
.thenAnswer(invocationOnMock0 -> {
Object response = invocationOnMock0.getArguments()[0];
ExtendedChannelPromise channelFuture = new ExtendedChannelPromise(channel);
- responseAndPromisePairs.add(ImmutablePair.of(response, channelFuture));
+ responseAndPromisePairs.add(Pair.of(response, channelFuture));
return channelFuture;
});
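
Note (illustrative, not part of the patch): at these call sites, and in the `getLeft`/`getRight` usage later in this patch, `org.apache.spark.util.Pair` only needs a public constructor, an `of` factory, and `getLeft`/`getRight` accessors. A minimal stand-in with that shape, purely for illustration; the real class may differ:

// Illustrative only: an immutable pair with the API surface the patch relies on.
public record Pair<L, R>(L left, R right) {
  public static <L, R> Pair<L, R> of(L left, R right) {
    return new Pair<>(left, right);
  }
  public L getLeft() { return left; }
  public R getRight() { return right; }

  public static void main(String[] args) {
    Pair<String, Integer> p = Pair.of("response", 200);
    System.out.println(p.getLeft() + " -> " + p.getRight());
  }
}
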
diff --git a/common/network-common/src/test/java/org/apache/spark/network/ProtocolSuite.java b/common/network-common/src/test/java/org/apache/spark/network/ProtocolSuite.java
index 8c1299ebcd836..500d91868bbbd 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/ProtocolSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/ProtocolSuite.java
@@ -19,7 +19,6 @@
import java.util.List;
-import com.google.common.primitives.Ints;
import io.netty.buffer.Unpooled;
import io.netty.channel.ChannelHandlerContext;
import io.netty.channel.FileRegion;
@@ -44,6 +43,7 @@
import org.apache.spark.network.protocol.StreamRequest;
import org.apache.spark.network.protocol.StreamResponse;
import org.apache.spark.network.util.ByteArrayWritableChannel;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.NettyUtils;
public class ProtocolSuite {
@@ -115,7 +115,8 @@ private static class FileRegionEncoder extends MessageToMessageEncoder<FileRegion> {
@Override
public void encode(ChannelHandlerContext ctx, FileRegion in, List<Object> out)
throws Exception {
- ByteArrayWritableChannel channel = new ByteArrayWritableChannel(Ints.checkedCast(in.count()));
+ ByteArrayWritableChannel channel =
+ new ByteArrayWritableChannel(JavaUtils.checkedCast(in.count()));
while (in.transferred() < in.count()) {
in.transferTo(channel, in.transferred());
}
diff --git a/common/network-common/src/test/java/org/apache/spark/network/RpcIntegrationSuite.java b/common/network-common/src/test/java/org/apache/spark/network/RpcIntegrationSuite.java
index 40495d6912c91..e229e32e91717 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/RpcIntegrationSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/RpcIntegrationSuite.java
@@ -24,10 +24,6 @@
import java.util.concurrent.Semaphore;
import java.util.concurrent.TimeUnit;
-import com.google.common.collect.Sets;
-import com.google.common.io.Files;
-import org.apache.commons.lang3.tuple.ImmutablePair;
-import org.apache.commons.lang3.tuple.Pair;
import org.junit.jupiter.api.AfterAll;
import org.junit.jupiter.api.BeforeAll;
import org.junit.jupiter.api.Test;
@@ -41,6 +37,7 @@
import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.MapConfigProvider;
import org.apache.spark.network.util.TransportConf;
+import org.apache.spark.util.Pair;
public class RpcIntegrationSuite {
static TransportConf conf;
@@ -248,14 +245,14 @@ public void onFailure(Throwable e) {
@Test
public void singleRPC() throws Exception {
RpcResult res = sendRPC("hello/Aaron");
- assertEquals(Sets.newHashSet("Hello, Aaron!"), res.successMessages);
+ assertEquals(Set.of("Hello, Aaron!"), res.successMessages);
assertTrue(res.errorMessages.isEmpty());
}
@Test
public void doubleRPC() throws Exception {
RpcResult res = sendRPC("hello/Aaron", "hello/Reynold");
- assertEquals(Sets.newHashSet("Hello, Aaron!", "Hello, Reynold!"), res.successMessages);
+ assertEquals(Set.of("Hello, Aaron!", "Hello, Reynold!"), res.successMessages);
assertTrue(res.errorMessages.isEmpty());
}
@@ -263,28 +260,28 @@ public void doubleRPC() throws Exception {
public void returnErrorRPC() throws Exception {
RpcResult res = sendRPC("return error/OK");
assertTrue(res.successMessages.isEmpty());
- assertErrorsContain(res.errorMessages, Sets.newHashSet("Returned: OK"));
+ assertErrorsContain(res.errorMessages, Set.of("Returned: OK"));
}
@Test
public void throwErrorRPC() throws Exception {
RpcResult res = sendRPC("throw error/uh-oh");
assertTrue(res.successMessages.isEmpty());
- assertErrorsContain(res.errorMessages, Sets.newHashSet("Thrown: uh-oh"));
+ assertErrorsContain(res.errorMessages, Set.of("Thrown: uh-oh"));
}
@Test
public void doubleTrouble() throws Exception {
RpcResult res = sendRPC("return error/OK", "throw error/uh-oh");
assertTrue(res.successMessages.isEmpty());
- assertErrorsContain(res.errorMessages, Sets.newHashSet("Returned: OK", "Thrown: uh-oh"));
+ assertErrorsContain(res.errorMessages, Set.of("Returned: OK", "Thrown: uh-oh"));
}
@Test
public void sendSuccessAndFailure() throws Exception {
RpcResult res = sendRPC("hello/Bob", "throw error/the", "hello/Builder", "return error/!");
- assertEquals(Sets.newHashSet("Hello, Bob!", "Hello, Builder!"), res.successMessages);
- assertErrorsContain(res.errorMessages, Sets.newHashSet("Thrown: the", "Returned: !"));
+ assertEquals(Set.of("Hello, Bob!", "Hello, Builder!"), res.successMessages);
+ assertErrorsContain(res.errorMessages, Set.of("Thrown: the", "Returned: !"));
}
@Test
@@ -311,7 +308,7 @@ public void sendRpcWithStreamOneAtATime() throws Exception {
for (String stream : StreamTestHelper.STREAMS) {
RpcResult res = sendRpcWithStream(stream);
assertTrue(res.errorMessages.isEmpty(), "there were error messages!" + res.errorMessages);
- assertEquals(Sets.newHashSet(stream), res.successMessages);
+ assertEquals(Set.of(stream), res.successMessages);
}
}
@@ -322,7 +319,7 @@ public void sendRpcWithStreamConcurrently() throws Exception {
streams[i] = StreamTestHelper.STREAMS[i % StreamTestHelper.STREAMS.length];
}
RpcResult res = sendRpcWithStream(streams);
- assertEquals(Sets.newHashSet(StreamTestHelper.STREAMS), res.successMessages);
+ assertEquals(Set.of(StreamTestHelper.STREAMS), res.successMessages);
assertTrue(res.errorMessages.isEmpty());
}
@@ -342,8 +339,8 @@ public void sendRpcWithStreamFailures() throws Exception {
RpcResult exceptionInOnComplete =
sendRpcWithStream("fail/exception-oncomplete/smallBuffer", "smallBuffer");
assertErrorsContain(exceptionInOnComplete.errorMessages,
- Sets.newHashSet("Failure post-processing"));
- assertEquals(Sets.newHashSet("smallBuffer"), exceptionInOnComplete.successMessages);
+ Set.of("Failure post-processing"));
+ assertEquals(Set.of("smallBuffer"), exceptionInOnComplete.successMessages);
}
private void assertErrorsContain(Set<String> errors, Set<String> contains) {
@@ -365,14 +362,14 @@ private void assertErrorAndClosed(RpcResult result, String expectedError) {
// We expect 1 additional error due to closed connection and here are possible keywords in the
// error message.
- Set<String> possibleClosedErrors = Sets.newHashSet(
+ Set<String> possibleClosedErrors = Set.of(
"closed",
"Connection reset",
"java.nio.channels.ClosedChannelException",
"io.netty.channel.StacklessClosedChannelException",
"java.io.IOException: Broken pipe"
);
- Set<String> containsAndClosed = Sets.newHashSet(expectedError);
+ Set<String> containsAndClosed = new HashSet<>(Set.of(expectedError));
containsAndClosed.addAll(possibleClosedErrors);
Pair<Set<String>, Set<String>> r = checkErrorsContain(errors, containsAndClosed);
@@ -392,8 +389,8 @@ private void assertErrorAndClosed(RpcResult result, String expectedError) {
private Pair<Set<String>, Set<String>> checkErrorsContain(
Set<String> errors,
Set<String> contains) {
- Set<String> remainingErrors = Sets.newHashSet(errors);
- Set<String> notFound = Sets.newHashSet();
+ Set<String> remainingErrors = new HashSet<>(errors);
+ Set<String> notFound = new HashSet<>();
for (String contain : contains) {
Iterator<String> it = remainingErrors.iterator();
boolean foundMatch = false;
@@ -408,7 +405,7 @@ private Pair<Set<String>, Set<String>> checkErrorsContain(
notFound.add(contain);
}
}
- return new ImmutablePair<>(remainingErrors, notFound);
+ return new Pair<>(remainingErrors, notFound);
}
private static class VerifyingStreamCallback implements StreamCallbackWithID {
@@ -431,7 +428,8 @@ private static class VerifyingStreamCallback implements StreamCallbackWithID {
void verify() throws IOException {
if (streamId.equals("file")) {
- assertTrue(Files.equal(testData.testFile, outFile), "File stream did not match.");
+ assertTrue(JavaUtils.contentEquals(testData.testFile, outFile),
+ "File stream did not match.");
} else {
byte[] result = ((ByteArrayOutputStream)out).toByteArray();
ByteBuffer srcBuffer = testData.srcBuffer(streamId);
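
Note (illustrative, not part of the patch): one detail worth calling out in `assertErrorAndClosed` above is that `containsAndClosed` is built as `new HashSet<>(Set.of(expectedError))` rather than plain `Set.of(expectedError)`, because `addAll` is called on it immediately afterwards and `Set.of` instances are unmodifiable. A small illustration:

import java.util.HashSet;
import java.util.Set;

public class MutableCopyExample {
  public static void main(String[] args) {
    Set<String> expected = Set.of("connection reset");        // unmodifiable literal
    Set<String> withClosedErrors = new HashSet<>(expected);   // mutable copy for addAll below
    withClosedErrors.addAll(Set.of("closed", "Broken pipe")); // would throw on Set.of directly
    System.out.println(withClosedErrors.size());              // 3
  }
}
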
diff --git a/common/network-common/src/test/java/org/apache/spark/network/StreamSuite.java b/common/network-common/src/test/java/org/apache/spark/network/StreamSuite.java
index 4f4637e302b94..496af96cb1cac 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/StreamSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/StreamSuite.java
@@ -29,7 +29,6 @@
import java.util.concurrent.ExecutorService;
import java.util.concurrent.TimeUnit;
-import com.google.common.io.Files;
import org.junit.jupiter.api.AfterAll;
import org.junit.jupiter.api.BeforeAll;
import org.junit.jupiter.api.Test;
@@ -43,6 +42,7 @@
import org.apache.spark.network.server.RpcHandler;
import org.apache.spark.network.server.StreamManager;
import org.apache.spark.network.server.TransportServer;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.MapConfigProvider;
import org.apache.spark.network.util.TransportConf;
@@ -212,7 +212,8 @@ public void run() {
callback.waitForCompletion(timeoutMs);
if (srcBuffer == null) {
- assertTrue(Files.equal(testData.testFile, outFile), "File stream did not match.");
+ assertTrue(JavaUtils.contentEquals(testData.testFile, outFile),
+ "File stream did not match.");
} else {
ByteBuffer base;
synchronized (srcBuffer) {
diff --git a/common/network-common/src/test/java/org/apache/spark/network/TestManagedBuffer.java b/common/network-common/src/test/java/org/apache/spark/network/TestManagedBuffer.java
index d1e93e3cb5845..828d995ba444b 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/TestManagedBuffer.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/TestManagedBuffer.java
@@ -21,11 +21,11 @@
import java.io.InputStream;
import java.nio.ByteBuffer;
-import com.google.common.base.Preconditions;
import io.netty.buffer.Unpooled;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.buffer.NettyManagedBuffer;
+import org.apache.spark.network.util.JavaUtils;
/**
* A ManagedBuffer implementation that contains 0, 1, 2, 3, ..., (len-1).
@@ -38,7 +38,7 @@ public class TestManagedBuffer extends ManagedBuffer {
private NettyManagedBuffer underlying;
public TestManagedBuffer(int len) {
- Preconditions.checkArgument(len <= Byte.MAX_VALUE);
+ JavaUtils.checkArgument(len <= Byte.MAX_VALUE, "length exceeds limit " + Byte.MAX_VALUE);
this.len = len;
byte[] byteArray = new byte[len];
for (int i = 0; i < len; i ++) {
diff --git a/common/network-common/src/test/java/org/apache/spark/network/TransportRequestHandlerSuite.java b/common/network-common/src/test/java/org/apache/spark/network/TransportRequestHandlerSuite.java
index d643fb4f662e3..9433e274b507f 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/TransportRequestHandlerSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/TransportRequestHandlerSuite.java
@@ -28,8 +28,6 @@
import static org.junit.jupiter.api.Assertions.*;
import static org.mockito.Mockito.*;
-import org.apache.commons.lang3.tuple.ImmutablePair;
-import org.apache.commons.lang3.tuple.Pair;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.client.RpcResponseCallback;
import org.apache.spark.network.client.TransportClient;
@@ -39,6 +37,7 @@
import org.apache.spark.network.server.RpcHandler;
import org.apache.spark.network.server.StreamManager;
import org.apache.spark.network.server.TransportRequestHandler;
+import org.apache.spark.util.Pair;
public class TransportRequestHandlerSuite {
@@ -53,7 +52,7 @@ public void handleStreamRequest() throws Exception {
.thenAnswer(invocationOnMock0 -> {
Object response = invocationOnMock0.getArguments()[0];
ExtendedChannelPromise channelFuture = new ExtendedChannelPromise(channel);
- responseAndPromisePairs.add(ImmutablePair.of(response, channelFuture));
+ responseAndPromisePairs.add(Pair.of(response, channelFuture));
return channelFuture;
});
@@ -145,7 +144,7 @@ public MergedBlockMetaReqHandler getMergedBlockMetaReqHandler() {
when(channel.writeAndFlush(any())).thenAnswer(invocationOnMock0 -> {
Object response = invocationOnMock0.getArguments()[0];
ExtendedChannelPromise channelFuture = new ExtendedChannelPromise(channel);
- responseAndPromisePairs.add(ImmutablePair.of(response, channelFuture));
+ responseAndPromisePairs.add(Pair.of(response, channelFuture));
return channelFuture;
});
diff --git a/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthEngineSuite.java b/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthEngineSuite.java
index 628de9e780337..904deabba5867 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthEngineSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthEngineSuite.java
@@ -21,7 +21,6 @@
import java.security.GeneralSecurityException;
import java.util.Map;
-import com.google.common.collect.ImmutableMap;
import com.google.crypto.tink.subtle.Hex;
import org.apache.spark.network.util.*;
@@ -49,7 +48,7 @@ abstract class AuthEngineSuite {
static TransportConf getConf(int authEngineVerison, boolean useCtr) {
String authEngineVersion = (authEngineVerison == 1) ? "1" : "2";
String mode = useCtr ? "AES/CTR/NoPadding" : "AES/GCM/NoPadding";
- Map<String, String> confMap = ImmutableMap.of(
+ Map<String, String> confMap = Map.of(
"spark.network.crypto.enabled", "true",
"spark.network.crypto.authEngineVersion", authEngineVersion,
"spark.network.crypto.cipher", mode
diff --git a/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthIntegrationSuite.java b/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthIntegrationSuite.java
index cb5929f7c65b4..8d1773316878b 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthIntegrationSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/crypto/AuthIntegrationSuite.java
@@ -22,7 +22,6 @@
import java.util.List;
import java.util.Map;
-import com.google.common.collect.ImmutableMap;
import io.netty.channel.Channel;
import org.junit.jupiter.api.AfterEach;
import org.junit.jupiter.api.Test;
@@ -214,7 +213,7 @@ private static class AuthTestCtx {
}
AuthTestCtx(RpcHandler rpcHandler, String mode) throws Exception {
- Map<String, String> testConf = ImmutableMap.of(
+ Map<String, String> testConf = Map.of(
"spark.network.crypto.enabled", "true",
"spark.network.crypto.cipher", mode);
this.conf = new TransportConf("rpc", new MapConfigProvider(testConf));
diff --git a/common/network-common/src/test/java/org/apache/spark/network/protocol/MergedBlockMetaSuccessSuite.java b/common/network-common/src/test/java/org/apache/spark/network/protocol/MergedBlockMetaSuccessSuite.java
index a3750ce11172b..41b84f3895876 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/protocol/MergedBlockMetaSuccessSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/protocol/MergedBlockMetaSuccessSuite.java
@@ -21,9 +21,9 @@
import java.io.File;
import java.io.FileOutputStream;
import java.nio.file.Files;
+import java.util.ArrayList;
import java.util.List;
-import com.google.common.collect.Lists;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.ByteBufAllocator;
import io.netty.buffer.Unpooled;
@@ -65,7 +65,7 @@ public void testMergedBlocksMetaEncodeDecode() throws Exception {
MergedBlockMetaSuccess expectedMeta = new MergedBlockMetaSuccess(requestId, 2,
new FileSegmentManagedBuffer(conf, chunkMetaFile, 0, chunkMetaFile.length()));
- List<Object> out = Lists.newArrayList();
+ List<Object> out = new ArrayList<>();
ChannelHandlerContext context = mock(ChannelHandlerContext.class);
when(context.alloc()).thenReturn(ByteBufAllocator.DEFAULT);
diff --git a/common/network-common/src/test/java/org/apache/spark/network/sasl/SparkSaslSuite.java b/common/network-common/src/test/java/org/apache/spark/network/sasl/SparkSaslSuite.java
index bf0424a1506a3..4feaf5cef3f2b 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/sasl/SparkSaslSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/sasl/SparkSaslSuite.java
@@ -23,6 +23,7 @@
import java.io.File;
import java.lang.reflect.Method;
import java.nio.ByteBuffer;
+import java.nio.file.Files;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
@@ -36,8 +37,6 @@
import javax.security.sasl.SaslException;
import com.google.common.collect.ImmutableMap;
-import com.google.common.io.ByteStreams;
-import com.google.common.io.Files;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import io.netty.channel.Channel;
@@ -221,7 +220,7 @@ public void testEncryptedMessageChunking() throws Exception {
byte[] data = new byte[8 * 1024];
new Random().nextBytes(data);
- Files.write(data, file);
+ Files.write(file.toPath(), data);
SaslEncryptionBackend backend = mock(SaslEncryptionBackend.class);
// It doesn't really matter what we return here, as long as it's not null.
@@ -245,7 +244,7 @@ public void testEncryptedMessageChunking() throws Exception {
@Test
public void testFileRegionEncryption() throws Exception {
- Map<String, String> testConf = ImmutableMap.of(
+ Map<String, String> testConf = Map.of(
"spark.network.sasl.maxEncryptedBlockSize", "1k");
AtomicReference<ManagedBuffer> response = new AtomicReference<>();
@@ -262,7 +261,7 @@ public void testFileRegionEncryption() throws Exception {
byte[] data = new byte[8 * 1024];
new Random().nextBytes(data);
- Files.write(data, file);
+ Files.write(file.toPath(), data);
ctx = new SaslTestCtx(rpcHandler, true, false, testConf);
@@ -282,7 +281,7 @@ public void testFileRegionEncryption() throws Exception {
verify(callback, times(1)).onSuccess(anyInt(), any(ManagedBuffer.class));
verify(callback, never()).onFailure(anyInt(), any(Throwable.class));
- byte[] received = ByteStreams.toByteArray(response.get().createInputStream());
+ byte[] received = response.get().createInputStream().readAllBytes();
assertArrayEquals(data, received);
} finally {
file.delete();
@@ -299,7 +298,7 @@ public void testFileRegionEncryption() throws Exception {
public void testServerAlwaysEncrypt() {
Exception re = assertThrows(Exception.class,
() -> new SaslTestCtx(mock(RpcHandler.class), false, false,
- ImmutableMap.of("spark.network.sasl.serverAlwaysEncrypt", "true")));
+ Map.of("spark.network.sasl.serverAlwaysEncrypt", "true")));
assertTrue(re.getCause() instanceof SaslException);
}
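
Note (illustrative, not part of the patch): the test changes above swap Guava's `Files.write(byte[], File)` and `ByteStreams.toByteArray` for `java.nio.file.Files.write` and `InputStream#readAllBytes` (JDK 9+). A self-contained example of the same pattern:

import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.nio.file.Files;
import java.util.Arrays;

public class NioIoExample {
  public static void main(String[] args) throws IOException {
    File file = File.createTempFile("payload", ".bin");
    byte[] data = {1, 2, 3, 4};

    // java.nio.file.Files.write replaces Guava's Files.write(byte[], File).
    Files.write(file.toPath(), data);

    // InputStream#readAllBytes replaces Guava's ByteStreams.toByteArray.
    try (InputStream in = Files.newInputStream(file.toPath())) {
      System.out.println(Arrays.equals(data, in.readAllBytes())); // true
    }
    file.delete();
  }
}
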
diff --git a/common/network-common/src/test/java/org/apache/spark/network/util/CryptoUtilsSuite.java b/common/network-common/src/test/java/org/apache/spark/network/util/CryptoUtilsSuite.java
index 47c9ef2490d2e..9673bbfbc2de7 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/util/CryptoUtilsSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/util/CryptoUtilsSuite.java
@@ -20,7 +20,6 @@
import java.util.Map;
import java.util.Properties;
-import com.google.common.collect.ImmutableMap;
import org.junit.jupiter.api.Test;
import static org.junit.jupiter.api.Assertions.*;
@@ -38,7 +37,7 @@ public void testConfConversion() {
String confVal2 = "val2";
String cryptoKey2 = CryptoUtils.COMMONS_CRYPTO_CONFIG_PREFIX + "A.b.c";
- Map<String, String> conf = ImmutableMap.of(
+ Map<String, String> conf = Map.of(
confKey1, confVal1,
confKey2, confVal2);
diff --git a/common/network-common/src/test/java/org/apache/spark/network/util/DBProviderSuite.java b/common/network-common/src/test/java/org/apache/spark/network/util/DBProviderSuite.java
index 81bfc55264c4c..f7299e157674e 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/util/DBProviderSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/util/DBProviderSuite.java
@@ -18,7 +18,6 @@
package org.apache.spark.network.util;
import com.fasterxml.jackson.databind.ObjectMapper;
-import org.apache.commons.lang3.SystemUtils;
import org.apache.spark.network.shuffledb.DBBackend;
import org.apache.spark.network.shuffledb.StoreVersion;
import org.junit.jupiter.api.Assertions;
@@ -38,7 +37,7 @@ public void testRockDBCheckVersionFailed() throws IOException, InterruptedException {
@Test
public void testLevelDBCheckVersionFailed() throws IOException, InterruptedException {
- assumeFalse(SystemUtils.IS_OS_MAC_OSX && SystemUtils.OS_ARCH.equals("aarch64"));
+ assumeFalse(JavaUtils.isMacOnAppleSilicon);
testCheckVersionFailed(DBBackend.LEVELDB, "leveldb");
}
diff --git a/common/network-common/src/test/java/org/apache/spark/network/util/JavaUtilsSuite.java b/common/network-common/src/test/java/org/apache/spark/network/util/JavaUtilsSuite.java
index 1336a587fd2eb..2edeb3f05c9b0 100644
--- a/common/network-common/src/test/java/org/apache/spark/network/util/JavaUtilsSuite.java
+++ b/common/network-common/src/test/java/org/apache/spark/network/util/JavaUtilsSuite.java
@@ -18,6 +18,7 @@
import java.io.File;
import java.io.IOException;
+import java.nio.file.Files;
import org.junit.jupiter.api.Test;
@@ -55,4 +56,33 @@ public void testCreateDirectory() throws IOException {
() -> JavaUtils.createDirectory(testDirPath, "scenario4"));
assertTrue(testDir.setWritable(true));
}
+
+ @Test
+ public void testListFiles() throws IOException {
+ File tmp = Files.createTempDirectory("testListFiles").toFile();
+ File file = new File(tmp, "file");
+
+ // Return empty set on non-existent input
+ assertFalse(file.exists());
+ assertEquals(0, JavaUtils.listFiles(file).size());
+ assertEquals(0, JavaUtils.listPaths(file).size());
+
+ // Return empty set on non-directory input
+ file.createNewFile();
+ assertTrue(file.exists());
+ assertEquals(0, JavaUtils.listFiles(file).size());
+ assertEquals(0, JavaUtils.listPaths(file).size());
+
+ // Return the contained files for a directory input
+ File dir = new File(tmp, "dir");
+ dir.mkdir();
+ new File(dir, "1").createNewFile();
+ assertEquals(1, JavaUtils.listFiles(dir).size());
+ assertEquals(1, JavaUtils.listPaths(dir).size());
+
+ File symlink = new File(tmp, "symlink");
+ Files.createSymbolicLink(symlink.toPath(), dir.toPath());
+ assertEquals(1, JavaUtils.listFiles(symlink).size());
+ assertEquals(1, JavaUtils.listPaths(symlink).size());
+ }
}
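
Note (illustrative, not part of the patch): the new `testListFiles` above pins down three behaviours for `JavaUtils.listFiles`/`listPaths`: an empty result for a non-existent path, an empty result for a non-directory input, and symlinked directories being followed. A rough JDK-only sketch with those semantics; the actual helpers may use java.nio and return different collection types:

import java.io.File;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;

public class ListFilesExample {
  static List<File> listFiles(File dir) {
    // File#listFiles returns null for a missing path or a non-directory input,
    // and follows symbolic links that point at directories.
    File[] children = dir.listFiles();
    return children == null ? Collections.emptyList() : Arrays.asList(children);
  }

  public static void main(String[] args) {
    System.out.println(listFiles(new File("does-not-exist")).size()); // 0
  }
}
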
diff --git a/common/network-shuffle/pom.xml b/common/network-shuffle/pom.xml
index adfc55d28c357..60ad971573997 100644
--- a/common/network-shuffle/pom.xml
+++ b/common/network-shuffle/pom.xml
@@ -42,6 +42,11 @@
       <version>${project.version}</version>
     </dependency>
+    <dependency>
+      <groupId>org.apache.commons</groupId>
+      <artifactId>commons-lang3</artifactId>
+    </dependency>
     <dependency>
       <groupId>io.dropwizard.metrics</groupId>
       <artifactId>metrics-core</artifactId>
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/sasl/ShuffleSecretManager.java b/common/network-shuffle/src/main/java/org/apache/spark/network/sasl/ShuffleSecretManager.java
index d67f2a3099d35..625cb2e1257da 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/sasl/ShuffleSecretManager.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/sasl/ShuffleSecretManager.java
@@ -55,7 +55,7 @@ public void registerApp(String appId, String shuffleSecret) {
// to the applicationId since the secrets change between application attempts on yarn.
shuffleSecretMap.put(appId, shuffleSecret);
logger.info("Registered shuffle secret for application {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, appId));
+ MDC.of(LogKeys.APP_ID, appId));
}
/**
@@ -72,7 +72,7 @@ public void registerApp(String appId, ByteBuffer shuffleSecret) {
public void unregisterApp(String appId) {
shuffleSecretMap.remove(appId);
logger.info("Unregistered shuffle secret for application {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, appId));
+ MDC.of(LogKeys.APP_ID, appId));
}
/**
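
Note (illustrative, not part of the patch): the `LogKeys.APP_ID$.MODULE$` form being removed throughout this patch is how Java code reaches a Scala `object` singleton; the new `LogKeys.APP_ID` form suggests the keys are now exposed directly to Java (for example as enum constants or static fields), which is an assumption here rather than something visible in this hunk. A minimal, purely illustrative sketch of the `MDC.of(key, value)` call shape:

// Illustrative only: a structured-logging key/value holder mirroring the call shape above.
// Spark's actual MDC and LogKeys types differ in detail.
public class MdcExample {
  enum LogKeys { APP_ID, PATH }

  record MDC(LogKeys key, Object value) {
    static MDC of(LogKeys key, Object value) { return new MDC(key, value); }
  }

  public static void main(String[] args) {
    MDC field = MDC.of(LogKeys.APP_ID, "app-20240101-0001");
    System.out.println(field.key() + "=" + field.value());
  }
}
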
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/AppsWithRecoveryDisabled.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/AppsWithRecoveryDisabled.java
index 6a029a1083a47..7a0b316a3a8ea 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/AppsWithRecoveryDisabled.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/AppsWithRecoveryDisabled.java
@@ -18,11 +18,10 @@
package org.apache.spark.network.shuffle;
import java.util.Collections;
+import java.util.Objects;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
-import com.google.common.base.Preconditions;
-
/**
* Stores the applications which have recovery disabled.
*/
@@ -41,8 +40,7 @@ private AppsWithRecoveryDisabled() {
* @param appId application id
*/
public static void disableRecoveryOfApp(String appId) {
- Preconditions.checkNotNull(appId);
- INSTANCE.appsWithRecoveryDisabled.add(appId);
+ INSTANCE.appsWithRecoveryDisabled.add(Objects.requireNonNull(appId));
}
/**
@@ -51,8 +49,7 @@ public static void disableRecoveryOfApp(String appId) {
* @return true if the application is enabled for recovery; false otherwise.
*/
public static boolean isRecoveryEnabledForApp(String appId) {
- Preconditions.checkNotNull(appId);
- return !INSTANCE.appsWithRecoveryDisabled.contains(appId);
+ return !INSTANCE.appsWithRecoveryDisabled.contains(Objects.requireNonNull(appId));
}
/**
@@ -60,7 +57,6 @@ public static boolean isRecoveryEnabledForApp(String appId) {
* @param appId application id
*/
public static void removeApp(String appId) {
- Preconditions.checkNotNull(appId);
- INSTANCE.appsWithRecoveryDisabled.remove(appId);
+ INSTANCE.appsWithRecoveryDisabled.remove(Objects.requireNonNull(appId));
}
}
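
Note (illustrative, not part of the patch): `Objects.requireNonNull` both validates and returns its argument, which is why the null check above folds into the `add`/`contains`/`remove` call instead of standing on its own line. A small example of the same pattern (names are hypothetical):

import java.util.Objects;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;

public class RequireNonNullExample {
  private static final Set<String> APPS = ConcurrentHashMap.newKeySet();

  // The null check and the use of the value happen in a single expression.
  static void disableRecovery(String appId) {
    APPS.add(Objects.requireNonNull(appId, "appId"));
  }

  public static void main(String[] args) {
    disableRecovery("app-1");
    try {
      disableRecovery(null);
    } catch (NullPointerException e) {
      System.out.println("rejected null appId");
    }
  }
}
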
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/BlockStoreClient.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/BlockStoreClient.java
index dcb0a52b0d66c..ceb5d64699744 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/BlockStoreClient.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/BlockStoreClient.java
@@ -173,7 +173,7 @@ public void onSuccess(ByteBuffer response) {
((LocalDirsForExecutors) msgObj).getLocalDirsByExec());
} catch (Throwable t) {
logger.warn("Error while trying to get the host local dirs for {}", t.getCause(),
- MDC.of(LogKeys.EXECUTOR_IDS$.MODULE$, Arrays.toString(getLocalDirsMessage.execIds)));
+ MDC.of(LogKeys.EXECUTOR_IDS, Arrays.toString(getLocalDirsMessage.execIds)));
hostLocalDirsCompletable.completeExceptionally(t);
}
}
@@ -181,7 +181,7 @@ public void onSuccess(ByteBuffer response) {
@Override
public void onFailure(Throwable t) {
logger.warn("Error while trying to get the host local dirs for {}", t.getCause(),
- MDC.of(LogKeys.EXECUTOR_IDS$.MODULE$, Arrays.toString(getLocalDirsMessage.execIds)));
+ MDC.of(LogKeys.EXECUTOR_IDS, Arrays.toString(getLocalDirsMessage.execIds)));
hostLocalDirsCompletable.completeExceptionally(t);
}
});
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ErrorHandler.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ErrorHandler.java
index 31ed10ad76f8f..298611cc8567f 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ErrorHandler.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ErrorHandler.java
@@ -20,10 +20,9 @@
import java.io.FileNotFoundException;
import java.net.ConnectException;
-import com.google.common.base.Throwables;
-
import org.apache.spark.annotation.Evolving;
import org.apache.spark.network.server.BlockPushNonFatalFailure;
+import org.apache.spark.network.util.JavaUtils;
/**
* Plugs into {@link RetryingBlockTransferor} to further control when an exception should be retried
@@ -105,12 +104,12 @@ class BlockFetchErrorHandler implements ErrorHandler {
@Override
public boolean shouldRetryError(Throwable t) {
- return !Throwables.getStackTraceAsString(t).contains(STALE_SHUFFLE_BLOCK_FETCH);
+ return !JavaUtils.stackTraceToString(t).contains(STALE_SHUFFLE_BLOCK_FETCH);
}
@Override
public boolean shouldLogError(Throwable t) {
- return !Throwables.getStackTraceAsString(t).contains(STALE_SHUFFLE_BLOCK_FETCH);
+ return !JavaUtils.stackTraceToString(t).contains(STALE_SHUFFLE_BLOCK_FETCH);
}
}
}
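
Note (illustrative, not part of the patch): `JavaUtils.stackTraceToString` replaces Guava's `Throwables.getStackTraceAsString` at these two call sites; both render a throwable's full stack trace as a `String` so it can be searched for a marker. A JDK-only sketch of that behaviour, not necessarily how Spark implements it:

import java.io.PrintWriter;
import java.io.StringWriter;

public class StackTraceExample {
  static String stackTraceToString(Throwable t) {
    StringWriter sw = new StringWriter();
    try (PrintWriter pw = new PrintWriter(sw)) {
      t.printStackTrace(pw);
    }
    return sw.toString();
  }

  public static void main(String[] args) {
    String trace = stackTraceToString(new RuntimeException("BLOCK_FETCH_FAILED"));
    System.out.println(trace.contains("BLOCK_FETCH_FAILED")); // true
  }
}
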
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockHandler.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockHandler.java
index 5d33bfb345a9e..45d0ff69de900 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockHandler.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockHandler.java
@@ -21,8 +21,10 @@
import java.io.IOException;
import java.nio.ByteBuffer;
import java.util.HashMap;
+import java.util.HashSet;
import java.util.Iterator;
import java.util.Map;
+import java.util.Objects;
import java.util.Set;
import java.util.concurrent.TimeUnit;
import java.util.function.Function;
@@ -35,8 +37,6 @@
import com.codahale.metrics.Timer;
import com.codahale.metrics.Counter;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
-import com.google.common.collect.Sets;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -199,7 +199,7 @@ protected void handleMessage(
} else if (msgObj instanceof GetLocalDirsForExecutors msg) {
checkAuth(client, msg.appId);
- Set<String> execIdsForBlockResolver = Sets.newHashSet(msg.execIds);
+ Set<String> execIdsForBlockResolver = new HashSet<>(Set.of(msg.execIds));
boolean fetchMergedBlockDirs = execIdsForBlockResolver.remove(SHUFFLE_MERGER_IDENTIFIER);
Map<String, String[]> localDirs = blockManager.getLocalDirs(msg.appId,
execIdsForBlockResolver);
@@ -224,9 +224,9 @@ protected void handleMessage(
} else if (msgObj instanceof RemoveShuffleMerge msg) {
checkAuth(client, msg.appId);
logger.info("Removing shuffle merge data for application {} shuffle {} shuffleMerge {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, msg.appId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, msg.shuffleId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, msg.shuffleMergeId));
+ MDC.of(LogKeys.APP_ID, msg.appId),
+ MDC.of(LogKeys.SHUFFLE_ID, msg.shuffleId),
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, msg.shuffleMergeId));
mergeManager.removeShuffleMerge(msg);
} else if (msgObj instanceof DiagnoseCorruption msg) {
checkAuth(client, msg.appId);
@@ -585,7 +585,7 @@ public boolean hasNext() {
@Override
public ManagedBuffer next() {
- ManagedBuffer block = Preconditions.checkNotNull(mergeManager.getMergedBlockData(
+ ManagedBuffer block = Objects.requireNonNull(mergeManager.getMergedBlockData(
appId, shuffleId, shuffleMergeId, reduceIds[reduceIdx], chunkIds[reduceIdx][chunkIdx]));
if (chunkIdx < chunkIds[reduceIdx].length - 1) {
chunkIdx += 1;
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockStoreClient.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockStoreClient.java
index 97723f77723d4..4fdd39c3471fc 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockStoreClient.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalBlockStoreClient.java
@@ -19,6 +19,7 @@
import java.io.IOException;
import java.nio.ByteBuffer;
+import java.util.ArrayList;
import java.util.Arrays;
import java.util.HashMap;
import java.util.List;
@@ -27,7 +28,6 @@
import java.util.concurrent.Future;
import com.codahale.metrics.MetricSet;
-import com.google.common.collect.Lists;
import org.apache.spark.internal.LogKeys;
import org.apache.spark.internal.MDC;
@@ -82,7 +82,7 @@ public void init(String appId) {
this.appId = appId;
TransportContext context = new TransportContext(
transportConf, new NoOpRpcHandler(), true, true);
- List<TransportClientBootstrap> bootstraps = Lists.newArrayList();
+ List<TransportClientBootstrap> bootstraps = new ArrayList<>();
if (authEnabled) {
bootstraps.add(new AuthClientBootstrap(transportConf, appId, secretKeyHolder));
}
@@ -106,7 +106,7 @@ private void setComparableAppAttemptId(String appAttemptId) {
} catch (NumberFormatException e) {
logger.warn("Push based shuffle requires comparable application attemptId, " +
"but the appAttemptId {} cannot be parsed to Integer", e,
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, appAttemptId));
+ MDC.of(LogKeys.APP_ATTEMPT_ID, appAttemptId));
}
}
@@ -221,8 +221,8 @@ public void onFailure(Throwable e) {
});
} catch (Exception e) {
logger.error("Exception while sending finalizeShuffleMerge request to {}:{}", e,
- MDC.of(LogKeys.HOST$.MODULE$, host),
- MDC.of(LogKeys.PORT$.MODULE$, port));
+ MDC.of(LogKeys.HOST, host),
+ MDC.of(LogKeys.PORT, port));
listener.onShuffleMergeFailure(e);
}
}
@@ -322,8 +322,8 @@ public void onSuccess(ByteBuffer response) {
} catch (Throwable t) {
logger.warn("Error trying to remove blocks {} via external shuffle service from " +
"executor: {}", t,
- MDC.of(LogKeys.BLOCK_IDS$.MODULE$, Arrays.toString(blockIds)),
- MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, execId));
+ MDC.of(LogKeys.BLOCK_IDS, Arrays.toString(blockIds)),
+ MDC.of(LogKeys.EXECUTOR_ID, execId));
numRemovedBlocksFuture.complete(0);
}
}
@@ -331,8 +331,8 @@ public void onSuccess(ByteBuffer response) {
@Override
public void onFailure(Throwable e) {
logger.warn("Error trying to remove blocks {} via external shuffle service from " +
- "executor: {}", e, MDC.of(LogKeys.BLOCK_IDS$.MODULE$, Arrays.toString(blockIds)),
- MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, execId));
+ "executor: {}", e, MDC.of(LogKeys.BLOCK_IDS, Arrays.toString(blockIds)),
+ MDC.of(LogKeys.EXECUTOR_ID, execId));
numRemovedBlocksFuture.complete(0);
}
});
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolver.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolver.java
index e43eedd8b25eb..b3002833fce1a 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolver.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolver.java
@@ -20,15 +20,13 @@
import java.io.*;
import java.nio.charset.StandardCharsets;
import java.util.*;
+import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.Executor;
import java.util.concurrent.Executors;
import java.util.stream.Collectors;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
-import org.apache.commons.lang3.tuple.Pair;
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonProperty;
import com.fasterxml.jackson.databind.ObjectMapper;
@@ -37,7 +35,6 @@
import com.google.common.cache.CacheLoader;
import com.google.common.cache.LoadingCache;
import com.google.common.cache.Weigher;
-import com.google.common.collect.Maps;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -56,6 +53,7 @@
import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.NettyUtils;
import org.apache.spark.network.util.TransportConf;
+import org.apache.spark.util.Pair;
/**
* Manages converting shuffle BlockIds into physical segments of local files, from a process outside
@@ -134,11 +132,11 @@ public ShuffleIndexInformation load(String filePath) throws IOException {
db = DBProvider.initDB(dbBackend, this.registeredExecutorFile, CURRENT_VERSION, mapper);
if (db != null) {
logger.info("Use {} as the implementation of {}",
- MDC.of(LogKeys.SHUFFLE_DB_BACKEND_NAME$.MODULE$, dbBackend),
- MDC.of(LogKeys.SHUFFLE_DB_BACKEND_KEY$.MODULE$, Constants.SHUFFLE_SERVICE_DB_BACKEND));
+ MDC.of(LogKeys.SHUFFLE_DB_BACKEND_NAME, dbBackend),
+ MDC.of(LogKeys.SHUFFLE_DB_BACKEND_KEY, Constants.SHUFFLE_SERVICE_DB_BACKEND));
executors = reloadRegisteredExecutors(db);
} else {
- executors = Maps.newConcurrentMap();
+ executors = new ConcurrentHashMap<>();
}
this.directoryCleaner = directoryCleaner;
}
@@ -154,8 +152,8 @@ public void registerExecutor(
ExecutorShuffleInfo executorInfo) {
AppExecId fullId = new AppExecId(appId, execId);
logger.info("Registered executor {} with {}",
- MDC.of(LogKeys.APP_EXECUTOR_ID$.MODULE$, fullId),
- MDC.of(LogKeys.EXECUTOR_SHUFFLE_INFO$.MODULE$, executorInfo));
+ MDC.of(LogKeys.APP_EXECUTOR_ID, fullId),
+ MDC.of(LogKeys.EXECUTOR_SHUFFLE_INFO, executorInfo));
try {
if (db != null && AppsWithRecoveryDisabled.isRecoveryEnabledForApp(appId)) {
byte[] key = dbAppExecKey(fullId);
@@ -221,8 +219,8 @@ public ManagedBuffer getRddBlockData(
*/
public void applicationRemoved(String appId, boolean cleanupLocalDirs) {
logger.info("Application {} removed, cleanupLocalDirs = {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, appId),
- MDC.of(LogKeys.CLEANUP_LOCAL_DIRS$.MODULE$, cleanupLocalDirs));
+ MDC.of(LogKeys.APP_ID, appId),
+ MDC.of(LogKeys.CLEANUP_LOCAL_DIRS, cleanupLocalDirs));
Iterator<Map.Entry<AppExecId, ExecutorShuffleInfo>> it = executors.entrySet().iterator();
while (it.hasNext()) {
Map.Entry<AppExecId, ExecutorShuffleInfo> entry = it.next();
@@ -237,14 +235,14 @@ public void applicationRemoved(String appId, boolean cleanupLocalDirs) {
db.delete(dbAppExecKey(fullId));
} catch (IOException e) {
logger.error("Error deleting {} from executor state db", e,
- MDC.of(LogKeys.APP_ID$.MODULE$, appId));
+ MDC.of(LogKeys.APP_ID, appId));
}
}
if (cleanupLocalDirs) {
logger.info("Cleaning up executor {}'s {} local dirs",
- MDC.of(LogKeys.APP_EXECUTOR_ID$.MODULE$, fullId),
- MDC.of(LogKeys.NUM_LOCAL_DIRS$.MODULE$, executor.localDirs.length));
+ MDC.of(LogKeys.APP_EXECUTOR_ID, fullId),
+ MDC.of(LogKeys.NUM_LOCAL_DIRS, executor.localDirs.length));
// Execute the actual deletion in a different thread, as it may take some time.
directoryCleaner.execute(() -> deleteExecutorDirs(executor.localDirs));
@@ -259,18 +257,18 @@ public void applicationRemoved(String appId, boolean cleanupLocalDirs) {
*/
public void executorRemoved(String executorId, String appId) {
logger.info("Clean up non-shuffle and non-RDD files associated with the finished executor {}",
- MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, executorId));
+ MDC.of(LogKeys.EXECUTOR_ID, executorId));
AppExecId fullId = new AppExecId(appId, executorId);
final ExecutorShuffleInfo executor = executors.get(fullId);
if (executor == null) {
// Executor not registered, skip clean up of the local directories.
logger.info("Executor is not registered (appId={}, execId={})",
- MDC.of(LogKeys.APP_ID$.MODULE$, appId),
- MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, executorId));
+ MDC.of(LogKeys.APP_ID, appId),
+ MDC.of(LogKeys.EXECUTOR_ID, executorId));
} else {
logger.info("Cleaning up non-shuffle and non-RDD files in executor {}'s {} local dirs",
- MDC.of(LogKeys.APP_EXECUTOR_ID$.MODULE$, fullId),
- MDC.of(LogKeys.NUM_LOCAL_DIRS$.MODULE$, executor.localDirs.length));
+ MDC.of(LogKeys.APP_EXECUTOR_ID, fullId),
+ MDC.of(LogKeys.NUM_LOCAL_DIRS, executor.localDirs.length));
// Execute the actual deletion in a different thread, as it may take some time.
directoryCleaner.execute(() -> deleteNonShuffleServiceServedFiles(executor.localDirs));
@@ -288,7 +286,7 @@ private void deleteExecutorDirs(String[] dirs) {
logger.debug("Successfully cleaned up directory: {}", localDir);
} catch (Exception e) {
logger.error("Failed to delete directory: {}", e,
- MDC.of(LogKeys.PATH$.MODULE$, localDir));
+ MDC.of(LogKeys.PATH, localDir));
}
}
}
@@ -311,7 +309,7 @@ private void deleteNonShuffleServiceServedFiles(String[] dirs) {
localDir);
} catch (Exception e) {
logger.error("Failed to delete files not served by shuffle service in directory: {}", e,
- MDC.of(LogKeys.PATH$.MODULE$, localDir));
+ MDC.of(LogKeys.PATH, localDir));
}
}
}
@@ -384,7 +382,7 @@ public int removeBlocks(String appId, String execId, String[] blockIds) {
numRemovedBlocks++;
} else {
logger.warn("Failed to delete block: {}",
- MDC.of(LogKeys.PATH$.MODULE$, file.getAbsolutePath()));
+ MDC.of(LogKeys.PATH, file.getAbsolutePath()));
}
}
return numRemovedBlocks;
@@ -400,7 +398,7 @@ public Map<String, String[]> getLocalDirs(String appId, Set<String> execIds) {
}
return Pair.of(exec, info.localDirs);
})
- .collect(Collectors.toMap(Pair::getKey, Pair::getValue));
+ .collect(Collectors.toMap(Pair::getLeft, Pair::getRight));
}
/**
@@ -451,10 +449,7 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execId", execId)
- .toString();
+ return "ExternalShuffleBlockResolver[appId=" + appId + ",execId=" + execId + "]";
}
}
@@ -477,7 +472,7 @@ private static AppExecId parseDbAppExecKey(String s) throws IOException {
@VisibleForTesting
static ConcurrentMap<AppExecId, ExecutorShuffleInfo> reloadRegisteredExecutors(DB db)
throws IOException {
- ConcurrentMap<AppExecId, ExecutorShuffleInfo> registeredExecutors = Maps.newConcurrentMap();
+ ConcurrentMap<AppExecId, ExecutorShuffleInfo> registeredExecutors = new ConcurrentHashMap<>();
if (db != null) {
try (DBIterator itr = db.iterator()) {
itr.seek(APP_KEY_PREFIX.getBytes(StandardCharsets.UTF_8));
@@ -489,7 +484,7 @@ static ConcurrentMap<AppExecId, ExecutorShuffleInfo> reloadRegisteredExecutors(DB db)
}
AppExecId id = parseDbAppExecKey(key);
logger.info("Reloading registered executors: {}",
- MDC.of(LogKeys.APP_EXECUTOR_ID$.MODULE$, id));
+ MDC.of(LogKeys.APP_EXECUTOR_ID, id));
ExecutorShuffleInfo shuffleInfo =
mapper.readValue(e.getValue(), ExecutorShuffleInfo.class);
registeredExecutors.put(id, shuffleInfo);
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/MergedBlockMeta.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/MergedBlockMeta.java
index 5541b7460ac96..ca8d9bbe65500 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/MergedBlockMeta.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/MergedBlockMeta.java
@@ -20,8 +20,8 @@
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
+import java.util.Objects;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
import io.netty.buffer.Unpooled;
import org.roaringbitmap.RoaringBitmap;
@@ -43,7 +43,7 @@ public class MergedBlockMeta {
public MergedBlockMeta(int numChunks, ManagedBuffer chunksBitmapBuffer) {
this.numChunks = numChunks;
- this.chunksBitmapBuffer = Preconditions.checkNotNull(chunksBitmapBuffer);
+ this.chunksBitmapBuffer = Objects.requireNonNull(chunksBitmapBuffer);
}
public int getNumChunks() {
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/OneForOneBlockPusher.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/OneForOneBlockPusher.java
index d90ca1a88a267..05158a6600d0d 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/OneForOneBlockPusher.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/OneForOneBlockPusher.java
@@ -21,8 +21,6 @@
import java.util.Arrays;
import java.util.Map;
-import com.google.common.base.Preconditions;
-
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
import org.apache.spark.network.buffer.ManagedBuffer;
@@ -34,6 +32,7 @@
import org.apache.spark.network.shuffle.protocol.BlockPushReturnCode;
import org.apache.spark.network.shuffle.protocol.BlockTransferMessage;
import org.apache.spark.network.shuffle.protocol.PushBlockStream;
+import org.apache.spark.network.util.JavaUtils;
/**
* Similar to {@link OneForOneBlockFetcher}, but for pushing blocks to remote shuffle service to
@@ -90,7 +89,7 @@ public void onSuccess(ByteBuffer response) {
ReturnCode returnCode = BlockPushNonFatalFailure.getReturnCode(pushResponse.returnCode);
if (returnCode != ReturnCode.SUCCESS) {
String blockId = pushResponse.failureBlockId;
- Preconditions.checkArgument(!blockId.isEmpty());
+ JavaUtils.checkArgument(!blockId.isEmpty(), "BlockID should not be empty");
checkAndFailRemainingBlocks(index, new BlockPushNonFatalFailure(returnCode,
BlockPushNonFatalFailure.getErrorMsg(blockId, returnCode)));
} else {
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RemoteBlockPushResolver.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RemoteBlockPushResolver.java
index 6e9bd548f5327..a48208bad5b8c 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RemoteBlockPushResolver.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RemoteBlockPushResolver.java
@@ -55,7 +55,6 @@
import com.codahale.metrics.Metric;
import com.codahale.metrics.MetricSet;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
import com.google.common.cache.CacheBuilder;
import com.google.common.cache.CacheLoader;
import com.google.common.cache.LoadingCache;
@@ -187,8 +186,8 @@ public ShuffleIndexInformation load(String filePath) throws IOException {
db = DBProvider.initDB(dbBackend, this.recoveryFile, CURRENT_VERSION, mapper);
if (db != null) {
logger.info("Use {} as the implementation of {}",
- MDC.of(LogKeys.SHUFFLE_DB_BACKEND_NAME$.MODULE$, dbBackend),
- MDC.of(LogKeys.SHUFFLE_DB_BACKEND_KEY$.MODULE$, Constants.SHUFFLE_SERVICE_DB_BACKEND));
+ MDC.of(LogKeys.SHUFFLE_DB_BACKEND_NAME, dbBackend),
+ MDC.of(LogKeys.SHUFFLE_DB_BACKEND_KEY, Constants.SHUFFLE_SERVICE_DB_BACKEND));
reloadAndCleanUpAppShuffleInfo(db);
}
this.pushMergeMetrics = new PushMergeMetrics();
@@ -211,7 +210,7 @@ public boolean shouldLogError(Throwable t) {
protected AppShuffleInfo validateAndGetAppShuffleInfo(String appId) {
// TODO: [SPARK-33236] Change the message when this service is able to handle NM restart
AppShuffleInfo appShuffleInfo = appsShuffleInfo.get(appId);
- Preconditions.checkArgument(appShuffleInfo != null,
+ JavaUtils.checkArgument(appShuffleInfo != null,
"application " + appId + " is not registered or NM was restarted.");
return appShuffleInfo;
}
@@ -234,10 +233,10 @@ AppShufflePartitionInfo getOrCreateAppShufflePartitionInfo(
if (mergePartitionsInfo == null) {
logger.info("{} attempt {} shuffle {} shuffleMerge {}: creating a new shuffle " +
"merge metadata",
- MDC.of(LogKeys.APP_ID$.MODULE$, appShuffleInfo.appId),
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, appShuffleInfo.attemptId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, shuffleId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, shuffleMergeId));
+ MDC.of(LogKeys.APP_ID, appShuffleInfo.appId),
+ MDC.of(LogKeys.APP_ATTEMPT_ID, appShuffleInfo.attemptId),
+ MDC.of(LogKeys.SHUFFLE_ID, shuffleId),
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, shuffleMergeId));
return new AppShuffleMergePartitionsInfo(shuffleMergeId, false);
} else {
int latestShuffleMergeId = mergePartitionsInfo.shuffleMergeId;
@@ -256,10 +255,10 @@ AppShufflePartitionInfo getOrCreateAppShufflePartitionInfo(
shuffleId, latestShuffleMergeId);
logger.info("{}: creating a new shuffle merge metadata since received " +
"shuffleMergeId {} is higher than latest shuffleMergeId {}",
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$,
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID,
currentAppAttemptShuffleMergeId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, shuffleMergeId),
- MDC.of(LogKeys.LATEST_SHUFFLE_MERGE_ID$.MODULE$, latestShuffleMergeId));
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, shuffleMergeId),
+ MDC.of(LogKeys.LATEST_SHUFFLE_MERGE_ID, latestShuffleMergeId));
submitCleanupTask(() ->
closeAndDeleteOutdatedPartitions(currentAppAttemptShuffleMergeId,
mergePartitionsInfo.shuffleMergePartitions));
@@ -293,13 +292,13 @@ AppShufflePartitionInfo getOrCreateAppShufflePartitionInfo(
} catch (IOException e) {
logger.error("{} attempt {} shuffle {} shuffleMerge {}: cannot create merged shuffle " +
"partition with data file {}, index file {}, and meta file {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, appShuffleInfo.appId),
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, appShuffleInfo.attemptId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, shuffleId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, shuffleMergeId),
- MDC.of(LogKeys.DATA_FILE$.MODULE$, dataFile.getAbsolutePath()),
- MDC.of(LogKeys.INDEX_FILE$.MODULE$, indexFile.getAbsolutePath()),
- MDC.of(LogKeys.META_FILE$.MODULE$, metaFile.getAbsolutePath()));
+ MDC.of(LogKeys.APP_ID, appShuffleInfo.appId),
+ MDC.of(LogKeys.APP_ATTEMPT_ID, appShuffleInfo.attemptId),
+ MDC.of(LogKeys.SHUFFLE_ID, shuffleId),
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, shuffleMergeId),
+ MDC.of(LogKeys.DATA_FILE, dataFile.getAbsolutePath()),
+ MDC.of(LogKeys.INDEX_FILE, indexFile.getAbsolutePath()),
+ MDC.of(LogKeys.META_FILE, metaFile.getAbsolutePath()));
throw new RuntimeException(
String.format("Cannot initialize merged shuffle partition for appId %s shuffleId %s "
+ "shuffleMergeId %s reduceId %s", appShuffleInfo.appId, shuffleId, shuffleMergeId,
@@ -411,8 +410,8 @@ private void removeOldApplicationAttemptsFromDb(AppShuffleInfo info) {
@Override
public void applicationRemoved(String appId, boolean cleanupLocalDirs) {
logger.info("Application {} removed, cleanupLocalDirs = {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, appId),
- MDC.of(LogKeys.CLEANUP_LOCAL_DIRS$.MODULE$, cleanupLocalDirs));
+ MDC.of(LogKeys.APP_ID, appId),
+ MDC.of(LogKeys.CLEANUP_LOCAL_DIRS, cleanupLocalDirs));
// Cleanup the DB within critical section to gain the consistency between
// DB and in-memory hashmap.
AtomicReference<AppShuffleInfo> ref = new AtomicReference<>(null);
@@ -523,7 +522,7 @@ void removeAppAttemptPathInfoFromDB(String appId, int attemptId) {
db.delete(key);
} catch (Exception e) {
logger.error("Failed to remove the application attempt {} local path in DB", e,
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, appAttemptId));
+ MDC.of(LogKeys.APP_ATTEMPT_ID, appAttemptId));
}
}
}
@@ -593,10 +592,10 @@ void deleteMergedFiles(
}
}
logger.info("Delete {} data files, {} index files, {} meta files for {}",
- MDC.of(LogKeys.NUM_DATA_FILES$.MODULE$, dataFilesDeleteCnt),
- MDC.of(LogKeys.NUM_INDEX_FILES$.MODULE$, indexFilesDeleteCnt),
- MDC.of(LogKeys.NUM_META_FILES$.MODULE$, metaFilesDeleteCnt),
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId));
+ MDC.of(LogKeys.NUM_DATA_FILES, dataFilesDeleteCnt),
+ MDC.of(LogKeys.NUM_INDEX_FILES, indexFilesDeleteCnt),
+ MDC.of(LogKeys.NUM_META_FILES, metaFilesDeleteCnt),
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId));
}
/**
@@ -609,7 +608,7 @@ void removeAppShufflePartitionInfoFromDB(AppAttemptShuffleMergeId appAttemptShuf
db.delete(getDbAppAttemptShufflePartitionKey(appAttemptShuffleMergeId));
} catch (Exception e) {
logger.error("Error deleting {} from application shuffle merged partition info in DB", e,
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId));
}
}
}
@@ -629,7 +628,7 @@ void deleteExecutorDirs(AppShuffleInfo appShuffleInfo) {
}
} catch (Exception e) {
logger.error("Failed to delete directory: {}", e,
- MDC.of(LogKeys.PATH$.MODULE$, localDir));
+ MDC.of(LogKeys.PATH, localDir));
}
}
}
@@ -759,10 +758,10 @@ public ByteBuffer getCompletionResponse() {
@Override
public MergeStatuses finalizeShuffleMerge(FinalizeShuffleMerge msg) {
logger.info("{} attempt {} shuffle {} shuffleMerge {}: finalize shuffle merge",
- MDC.of(LogKeys.APP_ID$.MODULE$, msg.appId),
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, msg.appAttemptId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, msg.shuffleId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, msg.shuffleMergeId));
+ MDC.of(LogKeys.APP_ID, msg.appId),
+ MDC.of(LogKeys.APP_ATTEMPT_ID, msg.appAttemptId),
+ MDC.of(LogKeys.SHUFFLE_ID, msg.shuffleId),
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, msg.shuffleMergeId));
AppShuffleInfo appShuffleInfo = validateAndGetAppShuffleInfo(msg.appId);
if (appShuffleInfo.attemptId != msg.appAttemptId) {
// If finalizeShuffleMerge from a former application attempt, it is considered late,
@@ -846,12 +845,12 @@ public MergeStatuses finalizeShuffleMerge(FinalizeShuffleMerge msg) {
} catch (IOException ioe) {
logger.warn("{} attempt {} shuffle {} shuffleMerge {}: exception while " +
"finalizing shuffle partition {}. Exception message: {}",
- MDC.of(LogKeys.APP_ID$.MODULE$, msg.appId),
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, msg.appAttemptId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, msg.shuffleId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, msg.shuffleMergeId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, partition.reduceId),
- MDC.of(LogKeys.EXCEPTION$.MODULE$, ioe.getMessage()));
+ MDC.of(LogKeys.APP_ID, msg.appId),
+ MDC.of(LogKeys.APP_ATTEMPT_ID, msg.appAttemptId),
+ MDC.of(LogKeys.SHUFFLE_ID, msg.shuffleId),
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, msg.shuffleMergeId),
+ MDC.of(LogKeys.REDUCE_ID, partition.reduceId),
+ MDC.of(LogKeys.EXCEPTION, ioe.getMessage()));
} finally {
partition.cleanable.clean();
}
@@ -863,10 +862,10 @@ public MergeStatuses finalizeShuffleMerge(FinalizeShuffleMerge msg) {
appShuffleInfo.shuffles.get(msg.shuffleId).setReduceIds(Ints.toArray(reduceIds));
}
logger.info("{} attempt {} shuffle {} shuffleMerge {}: finalization of shuffle merge completed",
- MDC.of(LogKeys.APP_ID$.MODULE$, msg.appId),
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, msg.appAttemptId),
- MDC.of(LogKeys.SHUFFLE_ID$.MODULE$, msg.shuffleId),
- MDC.of(LogKeys.SHUFFLE_MERGE_ID$.MODULE$, msg.shuffleMergeId));
+ MDC.of(LogKeys.APP_ID, msg.appId),
+ MDC.of(LogKeys.APP_ATTEMPT_ID, msg.appAttemptId),
+ MDC.of(LogKeys.SHUFFLE_ID, msg.shuffleId),
+ MDC.of(LogKeys.SHUFFLE_MERGE_ID, msg.shuffleMergeId));
return mergeStatuses;
}
@@ -934,8 +933,8 @@ public void registerExecutor(String appId, ExecutorShuffleInfo executorInfo) {
if (originalAppShuffleInfo.get() != null) {
AppShuffleInfo appShuffleInfo = originalAppShuffleInfo.get();
logger.warn("Cleanup shuffle info and merged shuffle files for {}_{} as new " +
- "application attempt registered", MDC.of(LogKeys.APP_ID$.MODULE$, appId),
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, appShuffleInfo.attemptId));
+ "application attempt registered", MDC.of(LogKeys.APP_ID, appId),
+ MDC.of(LogKeys.APP_ATTEMPT_ID, appShuffleInfo.attemptId));
// Clean up all the merge shuffle related information in the DB for the former attempt
submitCleanupTask(
() -> closeAndDeletePartitionsIfNeeded(appShuffleInfo, true)
@@ -992,12 +991,12 @@ private void shutdownMergedShuffleCleanerNow() {
List<Runnable> unfinishedTasks = mergedShuffleCleaner.shutdownNow();
logger.warn("There are still {} tasks not completed in mergedShuffleCleaner " +
"after {} ms.",
- MDC.of(LogKeys.COUNT$.MODULE$, unfinishedTasks.size()),
- MDC.of(LogKeys.TIMEOUT$.MODULE$, cleanerShutdownTimeout * 1000L));
+ MDC.of(LogKeys.COUNT, unfinishedTasks.size()),
+ MDC.of(LogKeys.TIMEOUT, cleanerShutdownTimeout * 1000L));
// Wait a while for tasks to respond to being cancelled
if (!mergedShuffleCleaner.awaitTermination(cleanerShutdownTimeout, TimeUnit.SECONDS)) {
logger.warn("mergedShuffleCleaner did not terminate in {} ms.",
- MDC.of(LogKeys.TIMEOUT$.MODULE$, cleanerShutdownTimeout * 1000L));
+ MDC.of(LogKeys.TIMEOUT, cleanerShutdownTimeout * 1000L));
}
} catch (InterruptedException ignored) {
Thread.currentThread().interrupt();
@@ -1017,7 +1016,7 @@ private void writeAppPathsInfoToDb(String appId, int attemptId, AppPathsInfo app
db.put(key, value);
} catch (Exception e) {
logger.error("Error saving registered app paths info for {}", e,
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, appAttemptId));
+ MDC.of(LogKeys.APP_ATTEMPT_ID, appAttemptId));
}
}
}
@@ -1035,7 +1034,7 @@ private void writeAppAttemptShuffleMergeInfoToDB(
db.put(dbKey, new byte[0]);
} catch (Exception e) {
logger.error("Error saving active app shuffle partition {}", e,
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId));
}
}
}
@@ -1137,7 +1136,7 @@ List reloadActiveAppAttemptsPathInfo(DB db) throws IOException {
dbKeysToBeRemoved.add(getDbAppAttemptPathsKey(existingAppAttemptId));
} catch (IOException e) {
logger.error("Failed to get the DB key for {}", e,
- MDC.of(LogKeys.APP_ATTEMPT_ID$.MODULE$, existingAppAttemptId));
+ MDC.of(LogKeys.APP_ATTEMPT_ID, existingAppAttemptId));
}
}
return new AppShuffleInfo(
@@ -1187,7 +1186,7 @@ List reloadFinalizedAppAttemptsShuffleMergeInfo(DB db) throws IOExceptio
getDbAppAttemptShufflePartitionKey(appAttemptShuffleMergeId));
} catch (Exception e) {
logger.error("Error getting the DB key for {}", e, MDC.of(
- LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId));
+ LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId));
}
}
return new AppShuffleMergePartitionsInfo(partitionId.shuffleMergeId, true);
@@ -1216,7 +1215,7 @@ void removeOutdatedKeyValuesInDB(List dbKeysToBeRemoved) {
db.delete(key);
} catch (Exception e) {
logger.error("Error deleting dangling key {} in DB", e,
- MDC.of(LogKeys.KEY$.MODULE$, key));
+ MDC.of(LogKeys.KEY, key));
}
}
);
@@ -1267,12 +1266,12 @@ private PushBlockStreamCallback(
String streamId,
AppShufflePartitionInfo partitionInfo,
int mapIndex) {
- Preconditions.checkArgument(mergeManager != null);
+ JavaUtils.checkArgument(mergeManager != null, "mergeManager is null");
this.mergeManager = mergeManager;
- Preconditions.checkArgument(appShuffleInfo != null);
+ JavaUtils.checkArgument(appShuffleInfo != null, "appShuffleInfo is null");
this.appShuffleInfo = appShuffleInfo;
this.streamId = streamId;
- Preconditions.checkArgument(partitionInfo != null);
+ JavaUtils.checkArgument(partitionInfo != null, "partitionInfo is null");
this.partitionInfo = partitionInfo;
this.mapIndex = mapIndex;
abortIfNecessary();
@@ -1599,7 +1598,7 @@ public void onComplete(String streamId) throws IOException {
public void onFailure(String streamId, Throwable throwable) throws IOException {
if (ERROR_HANDLER.shouldLogError(throwable)) {
logger.error("Encountered issue when merging {}", throwable,
- MDC.of(LogKeys.STREAM_ID$.MODULE$, streamId));
+ MDC.of(LogKeys.STREAM_ID, streamId));
} else {
logger.debug("Encountered issue when merging {}", streamId, throwable);
}
@@ -1719,7 +1718,7 @@ public AppAttemptShuffleMergeId(
@JsonProperty("attemptId") int attemptId,
@JsonProperty("shuffleId") int shuffleId,
@JsonProperty("shuffleMergeId") int shuffleMergeId) {
- Preconditions.checkArgument(appId != null, "app id is null");
+ JavaUtils.checkArgument(appId != null, "app id is null");
this.appId = appId;
this.attemptId = attemptId;
this.shuffleId = shuffleId;
@@ -1860,8 +1859,8 @@ void updateChunkInfo(long chunkOffset, int mapIndex) throws IOException {
indexMetaUpdateFailed = false;
} catch (IOException ioe) {
logger.warn("{} reduceId {} update to index/meta failed",
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, reduceId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId),
+ MDC.of(LogKeys.REDUCE_ID, reduceId));
indexMetaUpdateFailed = true;
// Any exception here is propagated to the caller and the caller can decide whether to
// abort or not.
@@ -1913,8 +1912,8 @@ private void finalizePartition() throws IOException {
private void deleteAllFiles() {
if (!dataFile.delete()) {
logger.info("Error deleting data file for {} reduceId {}",
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, reduceId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId),
+ MDC.of(LogKeys.REDUCE_ID, reduceId));
}
metaFile.delete();
indexFile.delete();
@@ -1983,22 +1982,22 @@ private void closeAllFiles(
}
} catch (IOException ioe) {
logger.warn("Error closing data channel for {} reduceId {}",
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, reduceId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId),
+ MDC.of(LogKeys.REDUCE_ID, reduceId));
}
try {
metaFile.close();
} catch (IOException ioe) {
logger.warn("Error closing meta file for {} reduceId {}",
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, reduceId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId),
+ MDC.of(LogKeys.REDUCE_ID, reduceId));
}
try {
indexFile.close();
} catch (IOException ioe) {
logger.warn("Error closing index file for {} reduceId {}",
- MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID$.MODULE$, appAttemptShuffleMergeId),
- MDC.of(LogKeys.REDUCE_ID$.MODULE$, reduceId));
+ MDC.of(LogKeys.APP_ATTEMPT_SHUFFLE_MERGE_ID, appAttemptShuffleMergeId),
+ MDC.of(LogKeys.REDUCE_ID, reduceId));
}
}
}
@@ -2043,9 +2042,9 @@ private AppPathsInfo(
this.subDirsPerLocalDir = subDirsPerLocalDir;
if (logger.isInfoEnabled()) {
logger.info("Updated active local dirs {} and sub dirs {} for application {}",
- MDC.of(LogKeys.PATHS$.MODULE$, Arrays.toString(activeLocalDirs)),
- MDC.of(LogKeys.NUM_SUB_DIRS$.MODULE$, subDirsPerLocalDir),
- MDC.of(LogKeys.APP_ID$.MODULE$, appId));
+ MDC.of(LogKeys.PATHS, Arrays.toString(activeLocalDirs)),
+ MDC.of(LogKeys.NUM_SUB_DIRS, subDirsPerLocalDir),
+ MDC.of(LogKeys.APP_ID, appId));
}
}
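Much of this file's churn is in the structured-logging call sites. Java only needs the `LogKeys.APP_ID$.MODULE$` spelling when it reaches into a Scala `object`'s companion field; once the keys are addressable as plain Java constants, the `$.MODULE$` indirection disappears and the call reads as `MDC.of(LogKeys.APP_ID, appId)`. The same hunks also swap Guava's `Preconditions.checkArgument` for `JavaUtils.checkArgument` with an explicit message (sketched after the RetryingBlockTransferor hunks below). The sketch here shows the new call-site shape with hypothetical `LogKey`/`MDCEntry` types; it is not Spark's `MDC`/`LogKeys` API, just a minimal stand-in.

```java
import java.util.Objects;

// Stand-ins: a plain Java enum of log keys and a tiny key/value holder.
enum LogKey { APP_ID, APP_ATTEMPT_ID, SHUFFLE_ID, SHUFFLE_MERGE_ID }

record MDCEntry(LogKey key, Object value) {
  static MDCEntry of(LogKey key, Object value) {
    return new MDCEntry(key, Objects.requireNonNull(value, "value"));
  }
}

public class MdcCallSiteSketch {
  public static void main(String[] args) {
    // Reads like the new call sites: MDC.of(LogKeys.APP_ID, appId) -- no $.MODULE$ needed
    // because the key is an ordinary Java constant, not a member of a Scala object.
    MDCEntry entry = MDCEntry.of(LogKey.APP_ID, "app-20240101-0001");
    System.out.println(entry.key() + " -> " + entry.value());
  }
}
```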
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RetryingBlockTransferor.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RetryingBlockTransferor.java
index 31c454f63a92e..1dae2d54120cb 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RetryingBlockTransferor.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/RetryingBlockTransferor.java
@@ -25,8 +25,6 @@
import java.util.concurrent.TimeUnit;
import com.google.common.annotations.VisibleForTesting;
-import com.google.common.base.Preconditions;
-import com.google.common.collect.Sets;
import com.google.common.util.concurrent.Uninterruptibles;
import org.apache.spark.internal.SparkLogger;
@@ -35,6 +33,7 @@
import org.apache.spark.internal.MDC;
import org.apache.spark.network.buffer.ManagedBuffer;
import org.apache.spark.network.sasl.SaslTimeoutException;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.NettyUtils;
import org.apache.spark.network.util.TransportConf;
@@ -131,7 +130,7 @@ public RetryingBlockTransferor(
this.listener = listener;
this.maxRetries = conf.maxIORetries();
this.retryWaitTime = conf.ioRetryWaitTimeMs();
- this.outstandingBlocksIds = Sets.newLinkedHashSet();
+ this.outstandingBlocksIds = new LinkedHashSet<>();
Collections.addAll(outstandingBlocksIds, blockIds);
this.currentListener = new RetryingBlockTransferListener();
this.errorHandler = errorHandler;
@@ -182,13 +181,13 @@ private void transferAllOutstanding() {
} catch (Exception e) {
if (numRetries > 0) {
logger.error("Exception while beginning {} of {} outstanding blocks (after {} retries)", e,
- MDC.of(LogKeys.TRANSFER_TYPE$.MODULE$, listener.getTransferType()),
- MDC.of(LogKeys.NUM_BLOCKS$.MODULE$, blockIdsToTransfer.length),
- MDC.of(LogKeys.NUM_RETRY$.MODULE$, numRetries));
+ MDC.of(LogKeys.TRANSFER_TYPE, listener.getTransferType()),
+ MDC.of(LogKeys.NUM_BLOCKS, blockIdsToTransfer.length),
+ MDC.of(LogKeys.NUM_RETRY, numRetries));
} else {
logger.error("Exception while beginning {} of {} outstanding blocks", e,
- MDC.of(LogKeys.TRANSFER_TYPE$.MODULE$, listener.getTransferType()),
- MDC.of(LogKeys.NUM_BLOCKS$.MODULE$, blockIdsToTransfer.length));
+ MDC.of(LogKeys.TRANSFER_TYPE, listener.getTransferType()),
+ MDC.of(LogKeys.NUM_BLOCKS, blockIdsToTransfer.length));
}
if (shouldRetry(e) && initiateRetry(e)) {
// successfully initiated a retry
@@ -216,11 +215,11 @@ synchronized boolean initiateRetry(Throwable e) {
currentListener = new RetryingBlockTransferListener();
logger.info("Retrying {} ({}/{}) for {} outstanding blocks after {} ms",
- MDC.of(LogKeys.TRANSFER_TYPE$.MODULE$, listener.getTransferType()),
- MDC.of(LogKeys.NUM_RETRY$.MODULE$, retryCount),
- MDC.of(LogKeys.MAX_ATTEMPTS$.MODULE$, maxRetries),
- MDC.of(LogKeys.NUM_BLOCKS$.MODULE$, outstandingBlocksIds.size()),
- MDC.of(LogKeys.RETRY_WAIT_TIME$.MODULE$, retryWaitTime));
+ MDC.of(LogKeys.TRANSFER_TYPE, listener.getTransferType()),
+ MDC.of(LogKeys.NUM_RETRY, retryCount),
+ MDC.of(LogKeys.MAX_ATTEMPTS, maxRetries),
+ MDC.of(LogKeys.NUM_BLOCKS, outstandingBlocksIds.size()),
+ MDC.of(LogKeys.RETRY_WAIT_TIME, retryWaitTime));
try {
executorService.execute(() -> {
@@ -247,7 +246,7 @@ private synchronized boolean shouldRetry(Throwable e) {
// If this is a non SASL request failure, reduce earlier SASL failures from retryCount
// since some subsequent SASL attempt was successful
if (!isSaslTimeout && saslRetryCount > 0) {
- Preconditions.checkState(retryCount >= saslRetryCount,
+ JavaUtils.checkState(retryCount >= saslRetryCount,
"retryCount must be greater than or equal to saslRetryCount");
retryCount -= saslRetryCount;
saslRetryCount = 0;
@@ -282,7 +281,7 @@ private void handleBlockTransferSuccess(String blockId, ManagedBuffer data) {
// If there were SASL failures earlier, remove them from retryCount, as there was
// a SASL success (and some other request post bootstrap was also successful).
if (saslRetryCount > 0) {
- Preconditions.checkState(retryCount >= saslRetryCount,
+ JavaUtils.checkState(retryCount >= saslRetryCount,
"retryCount must be greater than or equal to saslRetryCount");
retryCount -= saslRetryCount;
saslRetryCount = 0;
@@ -311,9 +310,9 @@ private void handleBlockTransferFailure(String blockId, Throwable exception) {
} else {
if (errorHandler.shouldLogError(exception)) {
logger.error("Failed to {} block {}, and will not retry ({} retries)", exception,
- MDC.of(LogKeys.TRANSFER_TYPE$.MODULE$, listener.getTransferType()),
- MDC.of(LogKeys.BLOCK_ID$.MODULE$, blockId),
- MDC.of(LogKeys.NUM_RETRY$.MODULE$,retryCount));
+ MDC.of(LogKeys.TRANSFER_TYPE, listener.getTransferType()),
+ MDC.of(LogKeys.BLOCK_ID, blockId),
+ MDC.of(LogKeys.NUM_RETRY, retryCount));
} else {
logger.debug(
String.format("Failed to %s block %s, and will not retry (%s retries)",
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/checksum/ShuffleChecksumHelper.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/checksum/ShuffleChecksumHelper.java
index 62fcda701d948..2dbf38be954db 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/checksum/ShuffleChecksumHelper.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/checksum/ShuffleChecksumHelper.java
@@ -21,8 +21,6 @@
import java.util.concurrent.TimeUnit;
import java.util.zip.*;
-import com.google.common.io.ByteStreams;
-
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
import org.apache.spark.internal.LogKeys;
@@ -88,7 +86,7 @@ public static String getChecksumFileName(String blockName, String algorithm) {
private static long readChecksumByReduceId(File checksumFile, int reduceId) throws IOException {
try (DataInputStream in = new DataInputStream(new FileInputStream(checksumFile))) {
- ByteStreams.skipFully(in, reduceId * 8L);
+ in.skipNBytes(reduceId * 8L);
return in.readLong();
}
}
@@ -156,7 +154,7 @@ public static Cause diagnoseCorruption(
} catch (FileNotFoundException e) {
// Even if checksum is enabled, a checksum file may not exist if error throws during writing.
logger.warn("Checksum file {} doesn't exit",
- MDC.of(LogKeys.PATH$.MODULE$, checksumFile.getName()));
+ MDC.of(LogKeys.PATH, checksumFile.getName()));
cause = Cause.UNKNOWN_ISSUE;
} catch (Exception e) {
logger.warn("Unable to diagnose shuffle block corruption", e);
@@ -169,9 +167,9 @@ public static Cause diagnoseCorruption(
checksumByReader, checksumByWriter, checksumByReCalculation);
} else {
logger.info("Shuffle corruption diagnosis took {} ms, checksum file {}, cause {}",
- MDC.of(LogKeys.TIME$.MODULE$, duration),
- MDC.of(LogKeys.PATH$.MODULE$, checksumFile.getAbsolutePath()),
- MDC.of(LogKeys.REASON$.MODULE$, cause));
+ MDC.of(LogKeys.TIME, duration),
+ MDC.of(LogKeys.PATH, checksumFile.getAbsolutePath()),
+ MDC.of(LogKeys.REASON, cause));
}
return cause;
}
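`ByteStreams.skipFully` is replaced by `InputStream.skipNBytes` (JDK 12+), which also skips exactly the requested number of bytes or throws `EOFException`. A standalone check of that behaviour against the one-long-per-reduceId layout implied by `readChecksumByReduceId` (the file contents here are made up):

```java
import java.io.DataInputStream;
import java.io.DataOutputStream;
import java.io.IOException;
import java.nio.file.Files;
import java.nio.file.Path;

public class SkipNBytesSketch {
  public static void main(String[] args) throws IOException {
    Path checksumFile = Files.createTempFile("shuffle-checksums", ".bin");
    try (DataOutputStream out = new DataOutputStream(Files.newOutputStream(checksumFile))) {
      for (long reduceId = 0; reduceId < 4; reduceId++) {
        out.writeLong(1000 + reduceId);  // one 8-byte checksum per reduce id
      }
    }
    int reduceId = 2;
    try (DataInputStream in = new DataInputStream(Files.newInputStream(checksumFile))) {
      in.skipNBytes(reduceId * 8L);       // seek to this reduce id's entry, or fail loudly
      System.out.println(in.readLong());  // prints 1002
    } finally {
      Files.deleteIfExists(checksumFile);
    }
  }
}
```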
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/AbstractFetchShuffleBlocks.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/AbstractFetchShuffleBlocks.java
index 0fca27cf26dfa..2bc57cc52f2cd 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/AbstractFetchShuffleBlocks.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/AbstractFetchShuffleBlocks.java
@@ -17,7 +17,8 @@
package org.apache.spark.network.shuffle.protocol;
-import com.google.common.base.Objects;
+import java.util.Objects;
+
import io.netty.buffer.ByteBuf;
import org.apache.commons.lang3.builder.ToStringBuilder;
@@ -43,12 +44,14 @@ protected AbstractFetchShuffleBlocks(
this.shuffleId = shuffleId;
}
+ // checkstyle.off: RegexpSinglelineJava
public ToStringBuilder toStringHelper() {
return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
.append("appId", appId)
.append("execId", execId)
.append("shuffleId", shuffleId);
}
+ // checkstyle.on: RegexpSinglelineJava
/**
* Returns number of blocks in the request.
@@ -61,7 +64,7 @@ public boolean equals(Object o) {
if (o == null || getClass() != o.getClass()) return false;
AbstractFetchShuffleBlocks that = (AbstractFetchShuffleBlocks) o;
return shuffleId == that.shuffleId
- && Objects.equal(appId, that.appId) && Objects.equal(execId, that.execId);
+ && Objects.equals(appId, that.appId) && Objects.equals(execId, that.execId);
}
@Override
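The `com.google.common.base.Objects` → `java.util.Objects` swap recurs through these protocol messages: `Objects.equal` becomes the null-safe `Objects.equals`, and the varargs `Objects.hashCode` becomes `Objects.hash`. A compact sketch of the pattern on a simplified stand-in class (not the real `AbstractFetchShuffleBlocks`):

```java
import java.util.Objects;

public class ObjectsMigrationSketch {
  static final class BlockRequest {
    final String appId;
    final String execId;
    final int shuffleId;

    BlockRequest(String appId, String execId, int shuffleId) {
      this.appId = appId;
      this.execId = execId;
      this.shuffleId = shuffleId;
    }

    @Override public boolean equals(Object o) {
      if (!(o instanceof BlockRequest that)) return false;
      // Objects.equals is null-safe, like Guava's Objects.equal.
      return shuffleId == that.shuffleId
        && Objects.equals(appId, that.appId) && Objects.equals(execId, that.execId);
    }

    @Override public int hashCode() {
      // Objects.hash is the JDK counterpart of Guava's varargs Objects.hashCode.
      return Objects.hash(appId, execId, shuffleId);
    }
  }

  public static void main(String[] args) {
    BlockRequest a = new BlockRequest("app-1", "exec-0", 7);
    BlockRequest b = new BlockRequest("app-1", "exec-0", 7);
    System.out.println(a.equals(b) && a.hashCode() == b.hashCode());  // true
  }
}
```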
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlockPushReturnCode.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlockPushReturnCode.java
index 05347c671e002..f4149b6875b26 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlockPushReturnCode.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlockPushReturnCode.java
@@ -19,10 +19,7 @@
import java.util.Objects;
-import com.google.common.base.Preconditions;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
import org.apache.spark.network.server.BlockPushNonFatalFailure;
@@ -43,7 +40,7 @@ public class BlockPushReturnCode extends BlockTransferMessage {
public final String failureBlockId;
public BlockPushReturnCode(byte returnCode, String failureBlockId) {
- Preconditions.checkNotNull(BlockPushNonFatalFailure.getReturnCode(returnCode));
+ Objects.requireNonNull(BlockPushNonFatalFailure.getReturnCode(returnCode));
this.returnCode = returnCode;
this.failureBlockId = failureBlockId;
}
@@ -60,10 +57,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("returnCode", returnCode)
- .append("failureBlockId", failureBlockId)
- .toString();
+ return "BlockPushReturnCode[returnCode=" + returnCode +
+ ",failureBlockId=" + failureBlockId + "]";
}
@Override
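Same theme in this message: `Preconditions.checkNotNull` gives way to `Objects.requireNonNull`, and the reflective `ToStringBuilder` output is replaced by a hand-rolled `ClassName[field=value,...]` string. A simplified stand-in (the real constructor validates the code via `BlockPushNonFatalFailure.getReturnCode`, which is omitted here, and the block id is invented):

```java
import java.util.Objects;

public class ToStringMigrationSketch {
  static final class ReturnCodeMessage {
    final byte returnCode;
    final String failureBlockId;

    ReturnCodeMessage(byte returnCode, String failureBlockId) {
      // Objects.requireNonNull replaces Preconditions.checkNotNull at construction time.
      this.failureBlockId = Objects.requireNonNull(failureBlockId);
      this.returnCode = returnCode;
    }

    @Override public String toString() {
      // Same information as the old SHORT_PREFIX_STYLE builder: class name + field=value pairs.
      return "ReturnCodeMessage[returnCode=" + returnCode +
        ",failureBlockId=" + failureBlockId + "]";
    }
  }

  public static void main(String[] args) {
    System.out.println(new ReturnCodeMessage((byte) 0, "shufflePush_0_0_1_2"));
  }
}
```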
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlocksRemoved.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlocksRemoved.java
index 2a050ce40b84b..9942d68297595 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlocksRemoved.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/BlocksRemoved.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
// Needed by ScalaDoc. See SPARK-7726
import static org.apache.spark.network.shuffle.protocol.BlockTransferMessage.Type;
@@ -44,9 +42,7 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("numRemovedBlocks", numRemovedBlocks)
- .toString();
+ return "BlocksRemoved[numRemovedBlocks=" + numRemovedBlocks + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/CorruptionCause.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/CorruptionCause.java
index 5690eee53bd13..d9b9d4d8f36c2 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/CorruptionCause.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/CorruptionCause.java
@@ -18,8 +18,6 @@
package org.apache.spark.network.shuffle.protocol;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.shuffle.checksum.Cause;
@@ -38,9 +36,7 @@ protected Type type() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("cause", cause)
- .toString();
+ return "CorruptionCause[cause=" + cause + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/DiagnoseCorruption.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/DiagnoseCorruption.java
index 620b5ad71cd75..e509f45a9f0e3 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/DiagnoseCorruption.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/DiagnoseCorruption.java
@@ -18,8 +18,6 @@
package org.apache.spark.network.shuffle.protocol;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
/** Request to get the cause of a corrupted block. Returns {@link CorruptionCause} */
@@ -56,15 +54,9 @@ protected Type type() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execId", execId)
- .append("shuffleId", shuffleId)
- .append("mapId", mapId)
- .append("reduceId", reduceId)
- .append("checksum", checksum)
- .append("algorithm", algorithm)
- .toString();
+ return "DiagnoseCorruption[appId=" + appId + ",execId=" + execId + ",shuffleId=" + shuffleId +
+ ",mapId=" + mapId + ",reduceId=" + reduceId + ",checksum=" + checksum +
+ ",algorithm=" + algorithm + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/ExecutorShuffleInfo.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/ExecutorShuffleInfo.java
index 8a3ccdef2920b..c53ab911c30da 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/ExecutorShuffleInfo.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/ExecutorShuffleInfo.java
@@ -23,8 +23,6 @@
import com.fasterxml.jackson.annotation.JsonCreator;
import com.fasterxml.jackson.annotation.JsonProperty;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encodable;
import org.apache.spark.network.protocol.Encoders;
@@ -60,11 +58,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("localDirs", Arrays.toString(localDirs))
- .append("subDirsPerLocalDir", subDirsPerLocalDir)
- .append("shuffleManager", shuffleManager)
- .toString();
+ return "ExecutorShuffleInfo[localDirs=" + Arrays.toString(localDirs) +
+ ",subDirsPerLocalDir=" + subDirsPerLocalDir + ",shuffleManager=" + shuffleManager + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlockChunks.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlockChunks.java
index cf4cbcf1ed08e..a6e1ce374b07f 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlockChunks.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlockChunks.java
@@ -60,11 +60,10 @@ public FetchShuffleBlockChunks(
@Override
public String toString() {
- return toStringHelper()
- .append("shuffleMergeId", shuffleMergeId)
- .append("reduceIds", Arrays.toString(reduceIds))
- .append("chunkIds", Arrays.deepToString(chunkIds))
- .toString();
+ return "FetchShuffleBlockChunks[appId=" + appId + ",execId=" + execId +
+ ",shuffleId=" + shuffleId + ",shuffleMergeId=" + shuffleMergeId +
+ ",reduceIds=" + Arrays.toString(reduceIds) +
+ ",chunkIds=" + Arrays.deepToString(chunkIds) + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlocks.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlocks.java
index 68550a2fba86e..686207767ca1e 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlocks.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FetchShuffleBlocks.java
@@ -62,11 +62,9 @@ public FetchShuffleBlocks(
@Override
public String toString() {
- return toStringHelper()
- .append("mapIds", Arrays.toString(mapIds))
- .append("reduceIds", Arrays.deepToString(reduceIds))
- .append("batchFetchEnabled", batchFetchEnabled)
- .toString();
+ return "FetchShuffleBlocks[appId=" + appId + ",execId=" + execId + ",shuffleId=" + shuffleId +
+ ",mapIds=" + Arrays.toString(mapIds) + ",reduceIds=" + Arrays.deepToString(reduceIds) +
+ ",batchFetchEnabled=" + batchFetchEnabled + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FinalizeShuffleMerge.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FinalizeShuffleMerge.java
index cd5e005348f42..61152f48a85ba 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FinalizeShuffleMerge.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/FinalizeShuffleMerge.java
@@ -17,10 +17,9 @@
package org.apache.spark.network.shuffle.protocol;
-import com.google.common.base.Objects;
+import java.util.Objects;
+
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -54,23 +53,19 @@ protected BlockTransferMessage.Type type() {
@Override
public int hashCode() {
- return Objects.hashCode(appId, appAttemptId, shuffleId, shuffleMergeId);
+ return Objects.hash(appId, appAttemptId, shuffleId, shuffleMergeId);
}
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("attemptId", appAttemptId)
- .append("shuffleId", shuffleId)
- .append("shuffleMergeId", shuffleMergeId)
- .toString();
+ return "FinalizeShuffleMerge[appId=" + appId + ",attemptId=" + appAttemptId +
+ ",shuffleId=" + shuffleId + ",shuffleMergeId=" + shuffleMergeId + "]";
}
@Override
public boolean equals(Object other) {
if (other instanceof FinalizeShuffleMerge o) {
- return Objects.equal(appId, o.appId)
+ return Objects.equals(appId, o.appId)
&& appAttemptId == o.appAttemptId
&& shuffleId == o.shuffleId
&& shuffleMergeId == o.shuffleMergeId;
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/GetLocalDirsForExecutors.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/GetLocalDirsForExecutors.java
index f118f0604d9e9..8bd106c94c283 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/GetLocalDirsForExecutors.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/GetLocalDirsForExecutors.java
@@ -21,8 +21,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -49,10 +47,7 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execIds", Arrays.toString(execIds))
- .toString();
+ return "GetLocalDirsForExecutors[appId=" + appId + ",execIds=" + Arrays.toString(execIds) + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/LocalDirsForExecutors.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/LocalDirsForExecutors.java
index b65f351d3cf3e..060b565d420fd 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/LocalDirsForExecutors.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/LocalDirsForExecutors.java
@@ -20,8 +20,6 @@
import java.util.*;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -64,11 +62,9 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("execIds", Arrays.toString(execIds))
- .append("numLocalDirsByExec", Arrays.toString(numLocalDirsByExec))
- .append("allLocalDirs", Arrays.toString(allLocalDirs))
- .toString();
+ return "LocalDirsForExecutors[execIds=" + Arrays.toString(execIds) +
+ ",numLocalDirsByExec=" + Arrays.toString(numLocalDirsByExec) +
+ ",allLocalDirs=" + Arrays.toString(allLocalDirs) + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/MergeStatuses.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/MergeStatuses.java
index 892c3a5e77958..d21449016972f 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/MergeStatuses.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/MergeStatuses.java
@@ -19,10 +19,9 @@
import java.util.Arrays;
-import com.google.common.base.Objects;
+import java.util.Objects;
+
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.roaringbitmap.RoaringBitmap;
import org.apache.spark.network.protocol.Encoders;
@@ -86,18 +85,15 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("shuffleId", shuffleId)
- .append("shuffleMergeId", shuffleMergeId)
- .append("reduceId size", reduceIds.length)
- .toString();
+ return "MergeStatuses[shuffleId=" + shuffleId + ",shuffleMergeId=" + shuffleMergeId +
+ ",reduceId size=" + reduceIds.length + "]";
}
@Override
public boolean equals(Object other) {
if (other instanceof MergeStatuses o) {
- return Objects.equal(shuffleId, o.shuffleId)
- && Objects.equal(shuffleMergeId, o.shuffleMergeId)
+ return Objects.equals(shuffleId, o.shuffleId)
+ && Objects.equals(shuffleMergeId, o.shuffleMergeId)
&& Arrays.equals(bitmaps, o.bitmaps)
&& Arrays.equals(reduceIds, o.reduceIds)
&& Arrays.equals(sizes, o.sizes);
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/OpenBlocks.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/OpenBlocks.java
index 49288eef5c5de..87b40eb1fc6ac 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/OpenBlocks.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/OpenBlocks.java
@@ -21,8 +21,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -51,11 +49,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execId", execId)
- .append("blockIds", Arrays.toString(blockIds))
- .toString();
+ return "OpenBlocks[appId=" + appId + ",execId=" + execId + ",blockIds=" +
+ Arrays.toString(blockIds) + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/PushBlockStream.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/PushBlockStream.java
index ceab54a1c0615..20e6e79c31980 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/PushBlockStream.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/PushBlockStream.java
@@ -17,11 +17,9 @@
package org.apache.spark.network.shuffle.protocol;
-import com.google.common.base.Objects;
-import io.netty.buffer.ByteBuf;
+import java.util.Objects;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
+import io.netty.buffer.ByteBuf;
import org.apache.spark.network.protocol.Encoders;
@@ -68,27 +66,21 @@ protected Type type() {
@Override
public int hashCode() {
- return Objects.hashCode(appId, appAttemptId, shuffleId, shuffleMergeId, mapIndex , reduceId,
+ return Objects.hash(appId, appAttemptId, shuffleId, shuffleMergeId, mapIndex, reduceId,
index);
}
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("attemptId", appAttemptId)
- .append("shuffleId", shuffleId)
- .append("shuffleMergeId", shuffleMergeId)
- .append("mapIndex", mapIndex)
- .append("reduceId", reduceId)
- .append("index", index)
- .toString();
+ return "PushBlockStream[appId=" + appId + ",attemptId=" + appAttemptId +
+ ",shuffleId=" + shuffleId + ",shuffleMergeId=" + shuffleMergeId + ",mapIndex=" + mapIndex +
+ ",reduceId=" + reduceId + ",index=" + index + "]";
}
@Override
public boolean equals(Object other) {
if (other instanceof PushBlockStream o) {
- return Objects.equal(appId, o.appId)
+ return Objects.equals(appId, o.appId)
&& appAttemptId == o.appAttemptId
&& shuffleId == o.shuffleId
&& shuffleMergeId == o.shuffleMergeId
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RegisterExecutor.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RegisterExecutor.java
index 9805af67b9f26..a5931126e4ff8 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RegisterExecutor.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RegisterExecutor.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -56,11 +54,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execId", execId)
- .append("executorInfo", executorInfo)
- .toString();
+ return "RegisterExecutor[appId=" + appId + ", execId=" + execId +
+ ",executorInfo=" + executorInfo + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveBlocks.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveBlocks.java
index 7032942331c3e..2743824b3d21c 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveBlocks.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveBlocks.java
@@ -21,8 +21,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -51,11 +49,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execId", execId)
- .append("blockIds", Arrays.toString(blockIds))
- .toString();
+ return "RemoveBlocks[appId=" + appId + ",execId=" + execId +
+ ",blockIds=" + Arrays.toString(blockIds) + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveShuffleMerge.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveShuffleMerge.java
index 8ce2e05e6097d..ac6d981b2e081 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveShuffleMerge.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/RemoveShuffleMerge.java
@@ -17,10 +17,9 @@
package org.apache.spark.network.shuffle.protocol;
-import com.google.common.base.Objects;
+import java.util.Objects;
+
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -54,23 +53,19 @@ protected Type type() {
@Override
public int hashCode() {
- return Objects.hashCode(appId, appAttemptId, shuffleId, shuffleMergeId);
+ return Objects.hash(appId, appAttemptId, shuffleId, shuffleMergeId);
}
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("attemptId", appAttemptId)
- .append("shuffleId", shuffleId)
- .append("shuffleMergeId", shuffleMergeId)
- .toString();
+ return "RemoveShuffleMerge[appId=" + appId + ",attemptId=" + appAttemptId +
+ ",shuffleId=" + shuffleId + ",shuffleMergeId=" + shuffleMergeId + "]";
}
@Override
public boolean equals(Object other) {
if (other != null && other instanceof RemoveShuffleMerge o) {
- return Objects.equal(appId, o.appId)
+ return Objects.equals(appId, o.appId)
&& appAttemptId == o.appAttemptId
&& shuffleId == o.shuffleId
&& shuffleMergeId == o.shuffleMergeId;
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/StreamHandle.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/StreamHandle.java
index aebd6f0d5a620..629e3c472e0a6 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/StreamHandle.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/StreamHandle.java
@@ -20,8 +20,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
// Needed by ScalaDoc. See SPARK-7726
import static org.apache.spark.network.shuffle.protocol.BlockTransferMessage.Type;
@@ -49,10 +47,7 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("streamId", streamId)
- .append("numChunks", numChunks)
- .toString();
+ return "StreamHandle[streamId=" + streamId + ",numChunks=" + numChunks + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlock.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlock.java
index fad187971e09a..9222134e6bb7f 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlock.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlock.java
@@ -21,8 +21,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -68,13 +66,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("appId", appId)
- .append("execId", execId)
- .append("blockId", blockId)
- .append("metadata size", metadata.length)
- .append("block size", blockData.length)
- .toString();
+ return "UploadBlock[appId=" + appId + ",execId=" + execId + ",blockId=" + blockId +
+ ",metadata size=" + metadata.length + ",block size=" + blockData.length + "]";
}
@Override
diff --git a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlockStream.java b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlockStream.java
index 95d0b3835562d..45c4c5f98de74 100644
--- a/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlockStream.java
+++ b/common/network-shuffle/src/main/java/org/apache/spark/network/shuffle/protocol/UploadBlockStream.java
@@ -21,8 +21,6 @@
import java.util.Objects;
import io.netty.buffer.ByteBuf;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.apache.spark.network.protocol.Encoders;
@@ -55,10 +53,7 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("blockId", blockId)
- .append("metadata size", metadata.length)
- .toString();
+ return "UploadBlockStream[blockId=" + blockId + ",metadata size=" + metadata.length + "]";
}
@Override
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/CleanupNonShuffleServiceServedFilesSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/CleanupNonShuffleServiceServedFilesSuite.java
index ccb464c2ce5bd..0c091d88f98b5 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/CleanupNonShuffleServiceServedFilesSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/CleanupNonShuffleServiceServedFilesSuite.java
@@ -20,21 +20,17 @@
import java.io.File;
import java.io.IOException;
import java.nio.charset.StandardCharsets;
-import java.nio.file.Files;
-import java.nio.file.Path;
import java.util.*;
import java.util.concurrent.Executor;
import java.util.concurrent.atomic.AtomicBoolean;
import java.util.stream.Collectors;
-import java.util.stream.Stream;
-import com.google.common.collect.ImmutableMap;
-import com.google.common.collect.ImmutableSet;
import org.junit.jupiter.api.Test;
import static org.junit.jupiter.api.Assertions.assertEquals;
import static org.junit.jupiter.api.Assertions.assertTrue;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.MapConfigProvider;
import org.apache.spark.network.util.TransportConf;
@@ -46,15 +42,15 @@ public class CleanupNonShuffleServiceServedFilesSuite {
private static final String SORT_MANAGER = "org.apache.spark.shuffle.sort.SortShuffleManager";
private static Set<String> expectedShuffleFilesToKeep =
- ImmutableSet.of("shuffle_782_450_0.index", "shuffle_782_450_0.data");
+ Set.of("shuffle_782_450_0.index", "shuffle_782_450_0.data");
private static Set<String> expectedShuffleAndRddFilesToKeep =
- ImmutableSet.of("shuffle_782_450_0.index", "shuffle_782_450_0.data", "rdd_12_34");
+ Set.of("shuffle_782_450_0.index", "shuffle_782_450_0.data", "rdd_12_34");
private TransportConf getConf(boolean isFetchRddEnabled) {
return new TransportConf(
"shuffle",
- new MapConfigProvider(ImmutableMap.of(
+ new MapConfigProvider(Map.of(
Constants.SHUFFLE_SERVICE_FETCH_RDD_ENABLED,
Boolean.toString(isFetchRddEnabled))));
}
@@ -200,28 +196,13 @@ private static void assertStillThere(TestShuffleDataContext dataContext) {
}
}
- private static Set<String> collectFilenames(File[] files) throws IOException {
- Set<String> result = new HashSet<>();
- for (File file : files) {
- if (file.exists()) {
- try (Stream<Path> walk = Files.walk(file.toPath())) {
- result.addAll(walk
- .filter(Files::isRegularFile)
- .map(x -> x.toFile().getName())
- .collect(Collectors.toSet()));
- }
- }
- }
- return result;
- }
-
private static void assertContainedFilenames(
TestShuffleDataContext dataContext,
Set<String> expectedFilenames) throws IOException {
Set<String> collectedFilenames = new HashSet<>();
for (String localDir : dataContext.localDirs) {
- File[] dirs = new File[] { new File(localDir) };
- collectedFilenames.addAll(collectFilenames(dirs));
+ JavaUtils.listFiles(new File(localDir)).stream().map(File::getName)
+ .collect(Collectors.toCollection(() -> collectedFilenames));
}
assertEquals(expectedFilenames, collectedFilenames);
}
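The deleted `collectFilenames` helper walked each local dir and collected the names of the regular files underneath; the suite now gets the same information from `JavaUtils.listFiles` (assumed here to enumerate the files under the given directory), and `Set.of`/`Map.of` replace the Guava immutable factories for the fixed expectation values. A JDK-only reconstruction of what the helper computed:

```java
import java.io.IOException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.Set;
import java.util.stream.Collectors;
import java.util.stream.Stream;

public class CollectFilenamesSketch {
  // Equivalent of the removed helper: names of all regular files under a directory.
  static Set<String> fileNamesUnder(Path dir) throws IOException {
    try (Stream<Path> walk = Files.walk(dir)) {
      return walk.filter(Files::isRegularFile)
        .map(p -> p.getFileName().toString())
        .collect(Collectors.toSet());
    }
  }

  public static void main(String[] args) throws IOException {
    Path localDir = Files.createTempDirectory("spark-local-dir");
    Files.createFile(localDir.resolve("shuffle_782_450_0.index"));
    Files.createFile(localDir.resolve("shuffle_782_450_0.data"));

    Set<String> expectedShuffleFilesToKeep =
      Set.of("shuffle_782_450_0.index", "shuffle_782_450_0.data");
    System.out.println(expectedShuffleFilesToKeep.equals(fileNamesUnder(localDir)));  // true
  }
}
```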
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalBlockHandlerSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalBlockHandlerSuite.java
index f7edc8837fde7..2a3135e3c8aeb 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalBlockHandlerSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalBlockHandlerSuite.java
@@ -27,7 +27,6 @@
import com.codahale.metrics.Meter;
import com.codahale.metrics.Metric;
import com.codahale.metrics.Timer;
-import com.google.common.io.ByteStreams;
import org.junit.jupiter.api.BeforeEach;
import org.junit.jupiter.api.Test;
import org.mockito.ArgumentCaptor;
@@ -136,7 +135,7 @@ private void checkDiagnosisResult(
CheckedInputStream checkedIn = new CheckedInputStream(
blockMarkers[0].createInputStream(), checksum);
byte[] buffer = new byte[10];
- ByteStreams.readFully(checkedIn, buffer, 0, (int) blockMarkers[0].size());
+ JavaUtils.readFully(checkedIn, buffer, 0, (int) blockMarkers[0].size());
long checksumByWriter = checkedIn.getChecksum().getValue();
// when checksumByWriter == checksumRecalculated and checksumByReader != checksumByWriter
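This test drains a block through a `CheckedInputStream` and compares the reader-side checksum with the writer's. A standalone version of that comparison, with `InputStream.readNBytes` standing in for the suite's `JavaUtils.readFully` call and CRC32 as an arbitrary checksum choice (the suite's actual algorithm is configured elsewhere):

```java
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.util.zip.CRC32;
import java.util.zip.CheckedInputStream;

public class ChecksumComparisonSketch {
  public static void main(String[] args) throws IOException {
    byte[] block = "0123456789".getBytes();  // pretend this is blockMarkers[0]

    // Checksum computed on the writer side.
    CRC32 checksumByWriter = new CRC32();
    checksumByWriter.update(block);

    // Reader side: drain the block through a CheckedInputStream, then compare.
    CheckedInputStream checkedIn =
      new CheckedInputStream(new ByteArrayInputStream(block), new CRC32());
    byte[] buffer = new byte[10];
    int read = checkedIn.readNBytes(buffer, 0, block.length);

    System.out.println(read == block.length
      && checkedIn.getChecksum().getValue() == checksumByWriter.getValue());  // true
  }
}
```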
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolverSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolverSuite.java
index 311827dbed4c5..488d02d63d552 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolverSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleBlockResolverSuite.java
@@ -19,12 +19,11 @@
import java.io.IOException;
import java.io.InputStream;
-import java.io.InputStreamReader;
import java.nio.charset.StandardCharsets;
import com.fasterxml.jackson.databind.ObjectMapper;
-import com.google.common.io.CharStreams;
import org.apache.spark.network.shuffle.protocol.ExecutorShuffleInfo;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.network.util.MapConfigProvider;
import org.apache.spark.network.util.TransportConf;
import org.apache.spark.network.shuffle.ExternalShuffleBlockResolver.AppExecId;
@@ -83,23 +82,17 @@ public void testSortShuffleBlocks() throws IOException {
try (InputStream block0Stream = resolver.getBlockData(
"app0", "exec0", 0, 0, 0).createInputStream()) {
- String block0 =
- CharStreams.toString(new InputStreamReader(block0Stream, StandardCharsets.UTF_8));
- assertEquals(sortBlock0, block0);
+ assertEquals(sortBlock0, JavaUtils.toString(block0Stream));
}
try (InputStream block1Stream = resolver.getBlockData(
"app0", "exec0", 0, 0, 1).createInputStream()) {
- String block1 =
- CharStreams.toString(new InputStreamReader(block1Stream, StandardCharsets.UTF_8));
- assertEquals(sortBlock1, block1);
+ assertEquals(sortBlock1, JavaUtils.toString(block1Stream));
}
try (InputStream blocksStream = resolver.getContinuousBlocksData(
"app0", "exec0", 0, 0, 0, 2).createInputStream()) {
- String blocks =
- CharStreams.toString(new InputStreamReader(blocksStream, StandardCharsets.UTF_8));
- assertEquals(sortBlock0 + sortBlock1, blocks);
+ assertEquals(sortBlock0 + sortBlock1, JavaUtils.toString(blocksStream));
}
}
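`JavaUtils.toString(InputStream)` replaces the `CharStreams` + `InputStreamReader` combination; the sketch below shows what that call is assumed to amount to (drain the stream and decode it as UTF-8), using only the JDK:

```java
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.nio.charset.StandardCharsets;

public class StreamToStringSketch {
  // Assumed equivalent of JavaUtils.toString(InputStream): read all bytes, decode as UTF-8.
  static String toString(InputStream in) throws IOException {
    return new String(in.readAllBytes(), StandardCharsets.UTF_8);
  }

  public static void main(String[] args) throws IOException {
    String sortBlock0 = "Hello, World!";
    try (InputStream block0Stream =
        new ByteArrayInputStream(sortBlock0.getBytes(StandardCharsets.UTF_8))) {
      System.out.println(sortBlock0.equals(toString(block0Stream)));  // true
    }
  }
}
```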
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleIntegrationSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleIntegrationSuite.java
index ec71f83ba743c..59381cabe063a 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleIntegrationSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleIntegrationSuite.java
@@ -32,7 +32,6 @@
import java.util.concurrent.Semaphore;
import java.util.concurrent.TimeUnit;
-import com.google.common.collect.Sets;
import org.apache.spark.network.buffer.FileSegmentManagedBuffer;
import org.apache.spark.network.server.OneForOneStreamManager;
import org.junit.jupiter.api.AfterAll;
@@ -222,7 +221,7 @@ public void testFetchOneSort() throws Exception {
try (ExternalBlockStoreClient client = createExternalBlockStoreClient()) {
registerExecutor(client, "exec-0", dataContext0.createExecutorInfo(SORT_MANAGER));
FetchResult exec0Fetch = fetchBlocks("exec-0", new String[] { "shuffle_0_0_0" });
- assertEquals(Sets.newHashSet("shuffle_0_0_0"), exec0Fetch.successBlocks);
+ assertEquals(Set.of("shuffle_0_0_0"), exec0Fetch.successBlocks);
assertTrue(exec0Fetch.failedBlocks.isEmpty());
assertBufferListsEqual(exec0Fetch.buffers, Arrays.asList(exec0Blocks[0]));
exec0Fetch.releaseBuffers();
@@ -235,7 +234,7 @@ public void testFetchThreeSort() throws Exception {
registerExecutor(client,"exec-0", dataContext0.createExecutorInfo(SORT_MANAGER));
FetchResult exec0Fetch = fetchBlocks("exec-0",
new String[]{"shuffle_0_0_0", "shuffle_0_0_1", "shuffle_0_0_2"});
- assertEquals(Sets.newHashSet("shuffle_0_0_0", "shuffle_0_0_1", "shuffle_0_0_2"),
+ assertEquals(Set.of("shuffle_0_0_0", "shuffle_0_0_1", "shuffle_0_0_2"),
exec0Fetch.successBlocks);
assertTrue(exec0Fetch.failedBlocks.isEmpty());
assertBufferListsEqual(exec0Fetch.buffers, Arrays.asList(exec0Blocks));
@@ -256,7 +255,7 @@ public void testFetchWrongBlockId() throws Exception {
registerExecutor(client, "exec-1", dataContext0.createExecutorInfo(SORT_MANAGER));
FetchResult execFetch = fetchBlocks("exec-1", new String[]{"broadcast_1"});
assertTrue(execFetch.successBlocks.isEmpty());
- assertEquals(Sets.newHashSet("broadcast_1"), execFetch.failedBlocks);
+ assertEquals(Set.of("broadcast_1"), execFetch.failedBlocks);
}
}
@@ -267,7 +266,7 @@ public void testFetchValidRddBlock() throws Exception {
String validBlockId = "rdd_" + RDD_ID + "_" + SPLIT_INDEX_VALID_BLOCK;
FetchResult execFetch = fetchBlocks("exec-1", new String[]{validBlockId});
assertTrue(execFetch.failedBlocks.isEmpty());
- assertEquals(Sets.newHashSet(validBlockId), execFetch.successBlocks);
+ assertEquals(Set.of(validBlockId), execFetch.successBlocks);
assertBuffersEqual(new NioManagedBuffer(ByteBuffer.wrap(exec0RddBlockValid)),
execFetch.buffers.get(0));
}
@@ -280,7 +279,7 @@ public void testFetchDeletedRddBlock() throws Exception {
String missingBlockId = "rdd_" + RDD_ID + "_" + SPLIT_INDEX_MISSING_FILE;
FetchResult execFetch = fetchBlocks("exec-1", new String[]{missingBlockId});
assertTrue(execFetch.successBlocks.isEmpty());
- assertEquals(Sets.newHashSet(missingBlockId), execFetch.failedBlocks);
+ assertEquals(Set.of(missingBlockId), execFetch.failedBlocks);
}
}
@@ -310,7 +309,7 @@ public void testFetchCorruptRddBlock() throws Exception {
String corruptBlockId = "rdd_" + RDD_ID + "_" + SPLIT_INDEX_CORRUPT_LENGTH;
FetchResult execFetch = fetchBlocks("exec-1", new String[]{corruptBlockId});
assertTrue(execFetch.successBlocks.isEmpty());
- assertEquals(Sets.newHashSet(corruptBlockId), execFetch.failedBlocks);
+ assertEquals(Set.of(corruptBlockId), execFetch.failedBlocks);
}
}
@@ -321,7 +320,7 @@ public void testFetchNonexistent() throws Exception {
FetchResult execFetch = fetchBlocks("exec-0",
new String[]{"shuffle_2_0_0"});
assertTrue(execFetch.successBlocks.isEmpty());
- assertEquals(Sets.newHashSet("shuffle_2_0_0"), execFetch.failedBlocks);
+ assertEquals(Set.of("shuffle_2_0_0"), execFetch.failedBlocks);
}
}
@@ -331,8 +330,8 @@ public void testFetchWrongExecutor() throws Exception {
registerExecutor(client,"exec-0", dataContext0.createExecutorInfo(SORT_MANAGER));
FetchResult execFetch0 = fetchBlocks("exec-0", new String[]{"shuffle_0_0_0" /* right */});
FetchResult execFetch1 = fetchBlocks("exec-0", new String[]{"shuffle_1_0_0" /* wrong */});
- assertEquals(Sets.newHashSet("shuffle_0_0_0"), execFetch0.successBlocks);
- assertEquals(Sets.newHashSet("shuffle_1_0_0"), execFetch1.failedBlocks);
+ assertEquals(Set.of("shuffle_0_0_0"), execFetch0.successBlocks);
+ assertEquals(Set.of("shuffle_1_0_0"), execFetch1.failedBlocks);
}
}
@@ -343,7 +342,7 @@ public void testFetchUnregisteredExecutor() throws Exception {
FetchResult execFetch = fetchBlocks("exec-2",
new String[]{"shuffle_0_0_0", "shuffle_1_0_0"});
assertTrue(execFetch.successBlocks.isEmpty());
- assertEquals(Sets.newHashSet("shuffle_0_0_0", "shuffle_1_0_0"), execFetch.failedBlocks);
+ assertEquals(Set.of("shuffle_0_0_0", "shuffle_1_0_0"), execFetch.failedBlocks);
}
}
@@ -355,7 +354,7 @@ public void testFetchNoServer() throws Exception {
FetchResult execFetch = fetchBlocks("exec-0",
new String[]{"shuffle_1_0_0", "shuffle_1_0_1"}, clientConf, 1 /* port */);
assertTrue(execFetch.successBlocks.isEmpty());
- assertEquals(Sets.newHashSet("shuffle_1_0_0", "shuffle_1_0_1"), execFetch.failedBlocks);
+ assertEquals(Set.of("shuffle_1_0_0", "shuffle_1_0_1"), execFetch.failedBlocks);
}
}
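`Set.of` fits these expectation values because they are small, fixed, non-null and duplicate-free; unlike `Sets.newHashSet` the result is immutable, which the equality assertions never notice since `Set.equals` only compares contents:

```java
import java.util.HashSet;
import java.util.Set;

public class SetOfSketch {
  public static void main(String[] args) {
    // Immutable expectation, as in the assertions above.
    Set<String> expected = Set.of("shuffle_0_0_0", "shuffle_0_0_1", "shuffle_0_0_2");

    // A mutable set built at runtime (e.g. the fetched block ids) still compares equal.
    Set<String> fetched = new HashSet<>();
    fetched.add("shuffle_0_0_0");
    fetched.add("shuffle_0_0_1");
    fetched.add("shuffle_0_0_2");

    System.out.println(expected.equals(fetched));  // true
  }
}
```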
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleSecuritySuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleSecuritySuite.java
index 76f82800c502a..170b72b409e12 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleSecuritySuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ExternalShuffleSecuritySuite.java
@@ -19,8 +19,8 @@
import java.io.IOException;
import java.util.Arrays;
+import java.util.Map;
-import com.google.common.collect.ImmutableMap;
import org.junit.jupiter.api.AfterEach;
import org.junit.jupiter.api.BeforeEach;
import org.junit.jupiter.api.Test;
@@ -46,7 +46,7 @@ public class ExternalShuffleSecuritySuite {
protected TransportConf createTransportConf(boolean encrypt) {
if (encrypt) {
return new TransportConf("shuffle", new MapConfigProvider(
- ImmutableMap.of("spark.authenticate.enableSaslEncryption", "true")));
+ Map.of("spark.authenticate.enableSaslEncryption", "true")));
} else {
return new TransportConf("shuffle", MapConfigProvider.EMPTY);
}
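Likewise, a one-entry `Map.of` literal covers the `MapConfigProvider` argument; the resulting map is unmodifiable, matching what `ImmutableMap.of` provided:

```java
import java.util.Map;

public class MapOfSketch {
  public static void main(String[] args) {
    // Small fixed config map, as passed to MapConfigProvider above.
    Map<String, String> conf = Map.of("spark.authenticate.enableSaslEncryption", "true");
    System.out.println(conf.get("spark.authenticate.enableSaslEncryption"));  // prints true
  }
}
```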
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockFetcherSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockFetcherSuite.java
index 7151d044105c7..f127568c8a333 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockFetcherSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockFetcherSuite.java
@@ -23,7 +23,6 @@
import java.util.LinkedHashMap;
import java.util.concurrent.atomic.AtomicInteger;
-import com.google.common.collect.Maps;
import io.netty.buffer.Unpooled;
import org.junit.jupiter.api.Test;
@@ -57,7 +56,7 @@ public class OneForOneBlockFetcherSuite {
@Test
public void testFetchOne() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffle_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[0])));
String[] blockIds = blocks.keySet().toArray(new String[blocks.size()]);
@@ -72,7 +71,7 @@ public void testFetchOne() {
@Test
public void testUseOldProtocol() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffle_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[0])));
String[] blockIds = blocks.keySet().toArray(new String[blocks.size()]);
@@ -91,7 +90,7 @@ public void testUseOldProtocol() {
@Test
public void testFetchThreeShuffleBlocks() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffle_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("shuffle_0_0_1", new NioManagedBuffer(ByteBuffer.wrap(new byte[23])));
blocks.put("shuffle_0_0_2", new NettyManagedBuffer(Unpooled.wrappedBuffer(new byte[23])));
@@ -112,7 +111,7 @@ public void testFetchThreeShuffleBlocks() {
@Test
public void testBatchFetchThreeShuffleBlocks() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffle_0_0_0_3", new NioManagedBuffer(ByteBuffer.wrap(new byte[58])));
String[] blockIds = blocks.keySet().toArray(new String[blocks.size()]);
@@ -129,7 +128,7 @@ public void testBatchFetchThreeShuffleBlocks() {
@Test
public void testFetchThree() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("b0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("b1", new NioManagedBuffer(ByteBuffer.wrap(new byte[23])));
blocks.put("b2", new NettyManagedBuffer(Unpooled.wrappedBuffer(new byte[23])));
@@ -148,7 +147,7 @@ public void testFetchThree() {
@Test
public void testFailure() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("b0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("b1", null);
blocks.put("b2", null);
@@ -168,7 +167,7 @@ public void testFailure() {
@Test
public void testFailureAndSuccess() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("b0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("b1", null);
blocks.put("b2", new NioManagedBuffer(ByteBuffer.wrap(new byte[21])));
@@ -190,14 +189,14 @@ public void testFailureAndSuccess() {
@Test
public void testEmptyBlockFetch() {
IllegalArgumentException e = assertThrows(IllegalArgumentException.class,
- () -> fetchBlocks(Maps.newLinkedHashMap(), new String[] {},
+ () -> fetchBlocks(new LinkedHashMap<>(), new String[] {},
new OpenBlocks("app-id", "exec-id", new String[] {}), conf));
assertEquals("Zero-sized blockIds array", e.getMessage());
}
@Test
public void testFetchShuffleBlocksOrder() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffle_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[1])));
blocks.put("shuffle_0_2_1", new NioManagedBuffer(ByteBuffer.wrap(new byte[2])));
blocks.put("shuffle_0_10_2", new NettyManagedBuffer(Unpooled.wrappedBuffer(new byte[3])));
@@ -217,7 +216,7 @@ public void testFetchShuffleBlocksOrder() {
@Test
public void testBatchFetchShuffleBlocksOrder() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffle_0_0_1_2", new NioManagedBuffer(ByteBuffer.wrap(new byte[1])));
blocks.put("shuffle_0_2_2_3", new NioManagedBuffer(ByteBuffer.wrap(new byte[2])));
blocks.put("shuffle_0_10_3_4", new NettyManagedBuffer(Unpooled.wrappedBuffer(new byte[3])));
@@ -237,7 +236,7 @@ public void testBatchFetchShuffleBlocksOrder() {
@Test
public void testShuffleBlockChunksFetch() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffleChunk_0_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("shuffleChunk_0_0_0_1", new NioManagedBuffer(ByteBuffer.wrap(new byte[23])));
blocks.put("shuffleChunk_0_0_0_2",
@@ -255,7 +254,7 @@ public void testShuffleBlockChunksFetch() {
@Test
public void testShuffleBlockChunkFetchFailure() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shuffleChunk_0_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("shuffleChunk_0_0_0_1", null);
blocks.put("shuffleChunk_0_0_0_2",
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockPusherSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockPusherSuite.java
index 32c6a8cd37eae..345ac7546af48 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockPusherSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/OneForOneBlockPusherSuite.java
@@ -23,7 +23,6 @@
import java.util.LinkedHashMap;
import java.util.Map;
-import com.google.common.collect.Maps;
import io.netty.buffer.Unpooled;
import org.junit.jupiter.api.Test;
@@ -47,7 +46,7 @@ public class OneForOneBlockPusherSuite {
@Test
public void testPushOne() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shufflePush_0_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[1])));
String[] blockIds = blocks.keySet().toArray(new String[blocks.size()]);
@@ -61,7 +60,7 @@ public void testPushOne() {
@Test
public void testPushThree() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shufflePush_0_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("shufflePush_0_0_1_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[23])));
blocks.put("shufflePush_0_0_2_0",
@@ -82,7 +81,7 @@ public void testPushThree() {
@Test
public void testServerFailures() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shufflePush_0_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("shufflePush_0_0_1_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[0])));
blocks.put("shufflePush_0_0_2_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[0])));
@@ -102,7 +101,7 @@ public void testServerFailures() {
@Test
public void testHandlingRetriableFailures() {
- LinkedHashMap<String, ManagedBuffer> blocks = Maps.newLinkedHashMap();
+ LinkedHashMap<String, ManagedBuffer> blocks = new LinkedHashMap<>();
blocks.put("shufflePush_0_0_0_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[12])));
blocks.put("shufflePush_0_0_1_0", null);
blocks.put("shufflePush_0_0_2_0", new NioManagedBuffer(ByteBuffer.wrap(new byte[0])));
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RemoteBlockPushResolverSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RemoteBlockPushResolverSuite.java
index edd5e1961a501..b7e24fe3da8fe 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RemoteBlockPushResolverSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RemoteBlockPushResolverSuite.java
@@ -39,9 +39,7 @@
import java.util.concurrent.TimeUnit;
import com.fasterxml.jackson.databind.ObjectMapper;
-import com.google.common.collect.ImmutableMap;
-import org.apache.commons.io.FileUtils;
import org.junit.jupiter.api.AfterEach;
import org.junit.jupiter.api.Assertions;
import org.junit.jupiter.api.BeforeEach;
@@ -68,6 +66,7 @@
import org.apache.spark.network.shuffle.protocol.RemoveShuffleMerge;
import org.apache.spark.network.util.MapConfigProvider;
import org.apache.spark.network.util.TransportConf;
+import org.apache.spark.network.util.JavaUtils;
/**
* Tests for {@link RemoteBlockPushResolver}.
@@ -97,7 +96,7 @@ public class RemoteBlockPushResolverSuite {
public void before() throws IOException {
localDirs = createLocalDirs(2);
MapConfigProvider provider = new MapConfigProvider(
- ImmutableMap.of("spark.shuffle.push.server.minChunkSizeInMergedShuffleFile", "4"));
+ Map.of("spark.shuffle.push.server.minChunkSizeInMergedShuffleFile", "4"));
conf = new TransportConf("shuffle", provider);
pushResolver = new RemoteBlockPushResolver(conf, null);
registerExecutor(TEST_APP, prepareLocalDirs(localDirs, MERGE_DIRECTORY), MERGE_DIRECTORY_META);
@@ -107,7 +106,7 @@ public void before() throws IOException {
public void after() {
try {
for (Path local : localDirs) {
- FileUtils.deleteDirectory(local.toFile());
+ JavaUtils.deleteRecursively(local.toFile());
}
removeApplication(TEST_APP);
} catch (Exception e) {
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RetryingBlockTransferorSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RetryingBlockTransferorSuite.java
index 84c8b1b3353f2..cbbade779ab68 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RetryingBlockTransferorSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/RetryingBlockTransferorSuite.java
@@ -29,7 +29,6 @@
import java.util.concurrent.TimeoutException;
import com.google.common.collect.ImmutableMap;
-import com.google.common.collect.Sets;
import org.junit.jupiter.api.BeforeEach;
import org.junit.jupiter.api.Test;
import org.mockito.stubbing.Answer;
@@ -353,15 +352,15 @@ public void testIOExceptionFailsConnectionEvenWithSaslException()
new TimeoutException());
IOException ioException = new IOException();
List<? extends Map<String, Object>> interactions = Arrays.asList(
- ImmutableMap.of("b0", saslExceptionInitial),
- ImmutableMap.of("b0", ioException),
- ImmutableMap.of("b0", saslExceptionInitial),
- ImmutableMap.of("b0", ioException),
- ImmutableMap.of("b0", saslExceptionFinal),
+ Map.of("b0", saslExceptionInitial),
+ Map.of("b0", ioException),
+ Map.of("b0", saslExceptionInitial),
+ Map.of("b0", ioException),
+ Map.of("b0", saslExceptionFinal),
// will not get invoked because the connection fails
- ImmutableMap.of("b0", ioException),
+ Map.of("b0", ioException),
// will not get invoked
- ImmutableMap.of("b0", block0)
+ Map.of("b0", block0)
);
configMap.put("spark.shuffle.sasl.enableRetries", "true");
performInteractions(interactions, listener);
@@ -425,7 +424,7 @@ private static void configureInteractions(List<? extends Map<String, Object>> in
Stubber stub = null;
// Contains all blockIds that are referenced across all interactions.
- LinkedHashSet<String> blockIds = Sets.newLinkedHashSet();
+ LinkedHashSet<String> blockIds = new LinkedHashSet<>();
for (Map interaction : interactions) {
blockIds.addAll(interaction.keySet());
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ShuffleTransportContextSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ShuffleTransportContextSuite.java
index aef3bc51bcd4b..bd9884e81ba92 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ShuffleTransportContextSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/ShuffleTransportContextSuite.java
@@ -18,12 +18,11 @@
package org.apache.spark.network.shuffle;
import java.io.IOException;
+import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
-import com.google.common.collect.Lists;
-
import io.netty.buffer.ByteBuf;
import io.netty.buffer.ByteBufAllocator;
import io.netty.buffer.Unpooled;
@@ -74,7 +73,7 @@ ShuffleTransportContext createShuffleTransportContext(boolean separateFinalizeTh
}
private ByteBuf getDecodableMessageBuf(Message req) throws Exception {
- List out = Lists.newArrayList();
+ List out = new ArrayList<>();
ChannelHandlerContext context = mock(ChannelHandlerContext.class);
when(context.alloc()).thenReturn(ByteBufAllocator.DEFAULT);
MessageEncoder.INSTANCE.encode(context, req, out);
@@ -118,7 +117,7 @@ public void testDecodeOfFinalizeShuffleMessage() throws Exception {
try (ShuffleTransportContext shuffleTransportContext = createShuffleTransportContext(true)) {
ShuffleTransportContext.ShuffleMessageDecoder decoder =
(ShuffleTransportContext.ShuffleMessageDecoder) shuffleTransportContext.getDecoder();
- List out = Lists.newArrayList();
+ List out = new ArrayList<>();
decoder.decode(mock(ChannelHandlerContext.class), messageBuf, out);
Assertions.assertEquals(1, out.size());
@@ -137,7 +136,7 @@ public void testDecodeOfAnyOtherRpcMessage() throws Exception {
try (ShuffleTransportContext shuffleTransportContext = createShuffleTransportContext(true)) {
ShuffleTransportContext.ShuffleMessageDecoder decoder =
(ShuffleTransportContext.ShuffleMessageDecoder) shuffleTransportContext.getDecoder();
- List out = Lists.newArrayList();
+ List out = new ArrayList<>();
decoder.decode(mock(ChannelHandlerContext.class), messageBuf, out);
Assertions.assertEquals(1, out.size());
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslExternalShuffleSecuritySuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslExternalShuffleSecuritySuite.java
index 061d63dbcd72d..a04ec60ca1c1c 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslExternalShuffleSecuritySuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslExternalShuffleSecuritySuite.java
@@ -17,7 +17,7 @@
package org.apache.spark.network.shuffle;
-import com.google.common.collect.ImmutableMap;
+import java.util.Map;
import org.apache.spark.network.ssl.SslSampleConfigs;
import org.apache.spark.network.util.TransportConf;
@@ -30,9 +30,7 @@ protected TransportConf createTransportConf(boolean encrypt) {
return new TransportConf(
"shuffle",
SslSampleConfigs.createDefaultConfigProviderForRpcNamespaceWithAdditionalEntries(
- ImmutableMap.of(
- "spark.authenticate.enableSaslEncryption",
- "true")
+ Map.of("spark.authenticate.enableSaslEncryption", "true")
)
);
} else {
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslShuffleTransportContextSuite.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslShuffleTransportContextSuite.java
index 51463bbad5576..1a85838792d29 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslShuffleTransportContextSuite.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/SslShuffleTransportContextSuite.java
@@ -17,7 +17,7 @@
package org.apache.spark.network.shuffle;
-import com.google.common.collect.ImmutableMap;
+import java.util.Map;
import org.apache.spark.network.ssl.SslSampleConfigs;
import org.apache.spark.network.util.TransportConf;
@@ -29,7 +29,7 @@ protected TransportConf createTransportConf(boolean separateFinalizeThread) {
return new TransportConf(
"shuffle",
SslSampleConfigs.createDefaultConfigProviderForRpcNamespaceWithAdditionalEntries(
- ImmutableMap.of(
+ Map.of(
"spark.shuffle.server.finalizeShuffleMergeThreadsPercent",
separateFinalizeThread ? "1" : "0")
)
diff --git a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/TestShuffleDataContext.java b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/TestShuffleDataContext.java
index 49b17824c3c72..4b8dc33c6bf52 100644
--- a/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/TestShuffleDataContext.java
+++ b/common/network-shuffle/src/test/java/org/apache/spark/network/shuffle/TestShuffleDataContext.java
@@ -22,6 +22,7 @@
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.OutputStream;
+import java.nio.file.Files;
import com.google.common.io.Closeables;
@@ -54,7 +55,7 @@ public void create() throws IOException {
localDirs[i] = JavaUtils.createDirectory(root, "spark").getAbsolutePath();
for (int p = 0; p < subDirsPerLocalDir; p ++) {
- new File(localDirs[i], String.format("%02x", p)).mkdirs();
+ Files.createDirectories(new File(localDirs[i], String.format("%02x", p)).toPath());
}
}
}
diff --git a/common/network-yarn/pom.xml b/common/network-yarn/pom.xml
index 78289684960ed..c4451923b17a5 100644
--- a/common/network-yarn/pom.xml
+++ b/common/network-yarn/pom.xml
@@ -48,7 +48,7 @@
<groupId>org.apache.spark</groupId>
<artifactId>spark-tags_${scala.binary.version}</artifactId>
- <scope>test</scope>
+ <scope>provided</scope>
diff --git a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationAwareUTF8String.java b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationAwareUTF8String.java
index e455e531de0dd..2b9457c58560f 100644
--- a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationAwareUTF8String.java
+++ b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationAwareUTF8String.java
@@ -1529,9 +1529,10 @@ public static UTF8String trimRight(
}
public static UTF8String[] splitSQL(final UTF8String input, final UTF8String delim,
- final int limit, final int collationId) {
+ final int limit, final int collationId, boolean legacySplitTruncate) {
if (CollationFactory.fetchCollation(collationId).isUtf8BinaryType) {
- return input.split(delim, limit);
+ return legacySplitTruncate ?
+ input.splitLegacyTruncate(delim, limit) : input.split(delim, limit);
} else if (CollationFactory.fetchCollation(collationId).isUtf8LcaseType) {
return lowercaseSplitSQL(input, delim, limit);
} else {
diff --git a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationFactory.java b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationFactory.java
index 4bcd75a731059..59c23064858d0 100644
--- a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationFactory.java
+++ b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationFactory.java
@@ -22,7 +22,6 @@
import java.util.concurrent.ConcurrentHashMap;
import java.util.function.Function;
import java.util.function.BiFunction;
-import java.util.function.ToLongFunction;
import java.util.stream.Stream;
import com.ibm.icu.text.CollationKey;
@@ -125,10 +124,19 @@ public static class Collation {
public final String version;
/**
- * Collation sensitive hash function. Output for two UTF8Strings will be the same if they are
- * equal according to the collation.
+ * Returns the sort key of the input UTF8String. Two UTF8String values are equal iff their
+ * sort keys are equal (compared as byte arrays).
+ * The sort key is defined as follows for collations without the RTRIM modifier:
+ * - UTF8_BINARY: It is the bytes of the string.
+ * - UTF8_LCASE: It is the byte array we get by replacing all invalid UTF8 sequences with the
+ * Unicode replacement character and then converting all characters of the replaced string
+ * to their lowercase equivalents (both the Greek capital and small sigma map to the
+ * Greek final sigma).
+ * - ICU collations: It is the byte array returned by the ICU library for the collated string.
+ * For strings with the RTRIM modifier, we right-trim the string and return the collation key
+ * of the resulting right-trimmed string.
*/
- public final ToLongFunction<UTF8String> hashFunction;
+ public final Function<UTF8String, byte[]> sortKeyFunction;
/**
* Potentially faster way than using comparator to compare two UTF8Strings for equality.
@@ -182,7 +190,7 @@ public Collation(
Collator collator,
Comparator<UTF8String> comparator,
String version,
- ToLongFunction<UTF8String> hashFunction,
+ Function<UTF8String, byte[]> sortKeyFunction,
BiFunction<UTF8String, UTF8String, Boolean> equalsFunction,
boolean isUtf8BinaryType,
boolean isUtf8LcaseType,
@@ -192,7 +200,7 @@ public Collation(
this.collator = collator;
this.comparator = comparator;
this.version = version;
- this.hashFunction = hashFunction;
+ this.sortKeyFunction = sortKeyFunction;
this.isUtf8BinaryType = isUtf8BinaryType;
this.isUtf8LcaseType = isUtf8LcaseType;
this.equalsFunction = equalsFunction;
@@ -581,18 +589,18 @@ private static boolean isValidCollationId(int collationId) {
protected Collation buildCollation() {
if (caseSensitivity == CaseSensitivity.UNSPECIFIED) {
Comparator<UTF8String> comparator;
- ToLongFunction<UTF8String> hashFunction;
+ Function<UTF8String, byte[]> sortKeyFunction;
BiFunction<UTF8String, UTF8String, Boolean> equalsFunction;
boolean supportsSpaceTrimming = spaceTrimming != SpaceTrimming.NONE;
if (spaceTrimming == SpaceTrimming.NONE) {
comparator = UTF8String::binaryCompare;
- hashFunction = s -> (long) s.hashCode();
+ sortKeyFunction = s -> s.getBytes();
equalsFunction = UTF8String::equals;
} else {
comparator = (s1, s2) -> applyTrimmingPolicy(s1, spaceTrimming).binaryCompare(
applyTrimmingPolicy(s2, spaceTrimming));
- hashFunction = s -> (long) applyTrimmingPolicy(s, spaceTrimming).hashCode();
+ sortKeyFunction = s -> applyTrimmingPolicy(s, spaceTrimming).getBytes();
equalsFunction = (s1, s2) -> applyTrimmingPolicy(s1, spaceTrimming).equals(
applyTrimmingPolicy(s2, spaceTrimming));
}
@@ -603,25 +611,25 @@ protected Collation buildCollation() {
null,
comparator,
CollationSpecICU.ICU_VERSION,
- hashFunction,
+ sortKeyFunction,
equalsFunction,
/* isUtf8BinaryType = */ true,
/* isUtf8LcaseType = */ false,
spaceTrimming != SpaceTrimming.NONE);
} else {
Comparator<UTF8String> comparator;
- ToLongFunction<UTF8String> hashFunction;
+ Function<UTF8String, byte[]> sortKeyFunction;
if (spaceTrimming == SpaceTrimming.NONE) {
comparator = CollationAwareUTF8String::compareLowerCase;
- hashFunction = s ->
- (long) CollationAwareUTF8String.lowerCaseCodePoints(s).hashCode();
+ sortKeyFunction = s ->
+ CollationAwareUTF8String.lowerCaseCodePoints(s).getBytes();
} else {
comparator = (s1, s2) -> CollationAwareUTF8String.compareLowerCase(
applyTrimmingPolicy(s1, spaceTrimming),
applyTrimmingPolicy(s2, spaceTrimming));
- hashFunction = s -> (long) CollationAwareUTF8String.lowerCaseCodePoints(
- applyTrimmingPolicy(s, spaceTrimming)).hashCode();
+ sortKeyFunction = s -> CollationAwareUTF8String.lowerCaseCodePoints(
+ applyTrimmingPolicy(s, spaceTrimming)).getBytes();
}
return new Collation(
@@ -630,7 +638,7 @@ protected Collation buildCollation() {
null,
comparator,
CollationSpecICU.ICU_VERSION,
- hashFunction,
+ sortKeyFunction,
(s1, s2) -> comparator.compare(s1, s2) == 0,
/* isUtf8BinaryType = */ false,
/* isUtf8LcaseType = */ true,
@@ -1013,19 +1021,18 @@ protected Collation buildCollation() {
collator.freeze();
Comparator<UTF8String> comparator;
- ToLongFunction<UTF8String> hashFunction;
+ Function<UTF8String, byte[]> sortKeyFunction;
if (spaceTrimming == SpaceTrimming.NONE) {
- hashFunction = s -> (long) collator.getCollationKey(
- s.toValidString()).hashCode();
comparator = (s1, s2) ->
collator.compare(s1.toValidString(), s2.toValidString());
+ sortKeyFunction = s -> collator.getCollationKey(s.toValidString()).toByteArray();
} else {
comparator = (s1, s2) -> collator.compare(
applyTrimmingPolicy(s1, spaceTrimming).toValidString(),
applyTrimmingPolicy(s2, spaceTrimming).toValidString());
- hashFunction = s -> (long) collator.getCollationKey(
- applyTrimmingPolicy(s, spaceTrimming).toValidString()).hashCode();
+ sortKeyFunction = s -> collator.getCollationKey(
+ applyTrimmingPolicy(s, spaceTrimming).toValidString()).toByteArray();
}
return new Collation(
@@ -1034,7 +1041,7 @@ protected Collation buildCollation() {
collator,
comparator,
ICU_VERSION,
- hashFunction,
+ sortKeyFunction,
(s1, s2) -> comparator.compare(s1, s2) == 0,
/* isUtf8BinaryType = */ false,
/* isUtf8LcaseType = */ false,
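
To make the new contract concrete, here is a minimal, hedged sketch of checking collation-aware equality through sort keys. It assumes the `fetchCollation(String)` accessor and a `Function<UTF8String, byte[]>` shape for `sortKeyFunction`, as the CollationFactorySuite changes further below suggest; treat it as illustrative rather than part of the patch.

import java.util.Arrays;
import org.apache.spark.sql.catalyst.util.CollationFactory;
import org.apache.spark.unsafe.types.UTF8String;

// Sketch only: equality under a collation corresponds to byte-wise equality of sort keys.
class SortKeySketch {
  static boolean equalUnder(String collationName, String a, String b) {
    CollationFactory.Collation collation = CollationFactory.fetchCollation(collationName);
    byte[] keyA = collation.sortKeyFunction.apply(UTF8String.fromString(a));
    byte[] keyB = collation.sortKeyFunction.apply(UTF8String.fromString(b));
    return Arrays.equals(keyA, keyB);
  }

  public static void main(String[] args) {
    System.out.println(equalUnder("UTF8_BINARY", "aaa", "AAA")); // false: raw bytes differ
    System.out.println(equalUnder("UTF8_LCASE", "aaa", "AAA"));  // true: lowercase code points match
  }
}
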
diff --git a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationSupport.java b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationSupport.java
index 135250e482b16..f950fd864c576 100644
--- a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationSupport.java
+++ b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/CollationSupport.java
@@ -706,8 +706,10 @@ public static int collationAwareRegexFlags(final int collationId) {
public static UTF8String lowercaseRegex(final UTF8String regex) {
return UTF8String.concat(lowercaseRegexPrefix, regex);
}
- public static UTF8String collationAwareRegex(final UTF8String regex, final int collationId) {
- return supportsLowercaseRegex(collationId) ? lowercaseRegex(regex) : regex;
+ public static UTF8String collationAwareRegex(
+ final UTF8String regex, final int collationId, boolean notIgnoreEmpty) {
+ return supportsLowercaseRegex(collationId) && (notIgnoreEmpty || regex.numBytes() != 0)
+ ? lowercaseRegex(regex) : regex;
}
/**
diff --git a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/DateTimeConstants.java b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/DateTimeConstants.java
index 0ae238564d591..d52207ad860cd 100644
--- a/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/DateTimeConstants.java
+++ b/common/unsafe/src/main/java/org/apache/spark/sql/catalyst/util/DateTimeConstants.java
@@ -45,4 +45,5 @@ public class DateTimeConstants {
public static final long NANOS_PER_MICROS = 1000L;
public static final long NANOS_PER_MILLIS = MICROS_PER_MILLIS * NANOS_PER_MICROS;
public static final long NANOS_PER_SECOND = MILLIS_PER_SECOND * NANOS_PER_MILLIS;
+ public static final long NANOS_PER_DAY = MICROS_PER_DAY * NANOS_PER_MICROS;
}
diff --git a/common/unsafe/src/main/java/org/apache/spark/unsafe/types/ByteArray.java b/common/unsafe/src/main/java/org/apache/spark/unsafe/types/ByteArray.java
index f12408fb49313..310dbce9eaab6 100644
--- a/common/unsafe/src/main/java/org/apache/spark/unsafe/types/ByteArray.java
+++ b/common/unsafe/src/main/java/org/apache/spark/unsafe/types/ByteArray.java
@@ -20,9 +20,8 @@
import java.nio.ByteOrder;
import java.util.Arrays;
-import com.google.common.primitives.Ints;
-
import org.apache.spark.unsafe.Platform;
+import org.apache.spark.network.util.JavaUtils;
public final class ByteArray {
@@ -169,7 +168,7 @@ public static byte[] concatWS(byte[] delimiter, byte[]... inputs) {
}
if (totalLength > 0) totalLength -= delimiter.length;
// Allocate a new byte array, and copy the inputs one by one into it
- final byte[] result = new byte[Ints.checkedCast(totalLength)];
+ final byte[] result = new byte[JavaUtils.checkedCast(totalLength)];
int offset = 0;
for (int i = 0; i < inputs.length; i++) {
byte[] input = inputs[i];
diff --git a/common/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java b/common/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
index caf8461b0b5d6..9209bd3135099 100644
--- a/common/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
+++ b/common/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
@@ -1168,10 +1168,21 @@ public UTF8String reverse() {
}
public UTF8String repeat(int times) {
- if (times <= 0) {
+ if (times <= 0 || numBytes == 0) {
return EMPTY_UTF8;
}
+ if (times == 1) {
+ return this;
+ }
+
+ if (numBytes == 1) {
+ byte[] newBytes = new byte[times];
+ byte b = getByte(0);
+ Arrays.fill(newBytes, b);
+ return fromBytes(newBytes);
+ }
+
byte[] newBytes = new byte[Math.multiplyExact(numBytes, times)];
copyMemory(this.base, this.offset, newBytes, BYTE_ARRAY_OFFSET, numBytes);
@@ -1483,6 +1494,25 @@ public static UTF8String concatWs(UTF8String separator, UTF8String... inputs) {
}
public UTF8String[] split(UTF8String pattern, int limit) {
+ // For an empty `pattern`, the `split` function ignores trailing empty strings unless the
+ // original string is empty.
+ if (numBytes() != 0 && pattern.numBytes() == 0) {
+ int newLimit = limit > numChars() || limit <= 0 ? numChars() : limit;
+ byte[] input = getBytes();
+ int byteIndex = 0;
+ UTF8String[] result = new UTF8String[newLimit];
+ for (int charIndex = 0; charIndex < newLimit - 1; charIndex++) {
+ int currCharNumBytes = numBytesForFirstByte(input[byteIndex]);
+ result[charIndex] = UTF8String.fromBytes(input, byteIndex, currCharNumBytes);
+ byteIndex += currCharNumBytes;
+ }
+ result[newLimit - 1] = UTF8String.fromBytes(input, byteIndex, numBytes() - byteIndex);
+ return result;
+ }
+ return split(pattern.toString(), limit);
+ }
+
+ public UTF8String[] splitLegacyTruncate(UTF8String pattern, int limit) {
// For the empty `pattern` a `split` function ignores trailing empty strings unless original
// string is empty.
if (numBytes() != 0 && pattern.numBytes() == 0) {
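
As a quick illustration of why `splitLegacyTruncate` is kept around, here is a hedged sketch of the empty-delimiter behavior; it only exercises the two methods shown in this diff, and the expected values mirror the UTF8StringSuite change below.

import org.apache.spark.unsafe.types.UTF8String;

// Sketch only: with an empty pattern and limit 1, the new split keeps the whole
// input, while the legacy path truncated the result to the first character.
class SplitBehaviorSketch {
  public static void main(String[] args) {
    UTF8String s = UTF8String.fromString("ab");
    UTF8String empty = UTF8String.fromString("");

    UTF8String[] current = s.split(empty, 1);              // ["ab"]
    UTF8String[] legacy = s.splitLegacyTruncate(empty, 1); // ["a"]

    System.out.println(current[0] + " / " + legacy[0]);    // prints: ab / a
  }
}
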
diff --git a/common/unsafe/src/test/java/org/apache/spark/unsafe/types/UTF8StringSuite.java b/common/unsafe/src/test/java/org/apache/spark/unsafe/types/UTF8StringSuite.java
index c4a66fdffdd4d..26b96155377e8 100644
--- a/common/unsafe/src/test/java/org/apache/spark/unsafe/types/UTF8StringSuite.java
+++ b/common/unsafe/src/test/java/org/apache/spark/unsafe/types/UTF8StringSuite.java
@@ -24,7 +24,6 @@
import java.nio.charset.StandardCharsets;
import java.util.*;
-import com.google.common.collect.ImmutableMap;
import org.apache.spark.unsafe.Platform;
import org.apache.spark.unsafe.UTF8StringBuilder;
@@ -432,7 +431,7 @@ public void split() {
new UTF8String[]{fromString("a"), fromString("b")},
fromString("ab").split(fromString(""), 100));
assertArrayEquals(
- new UTF8String[]{fromString("a")},
+ new UTF8String[]{fromString("ab")},
fromString("ab").split(fromString(""), 1));
assertArrayEquals(
new UTF8String[]{fromString("")},
@@ -495,7 +494,7 @@ public void levenshteinDistance() {
public void translate() {
assertEquals(
fromString("1a2s3ae"),
- fromString("translate").translate(ImmutableMap.of(
+ fromString("translate").translate(Map.of(
"r", "1",
"n", "2",
"l", "3",
@@ -506,7 +505,7 @@ public void translate() {
fromString("translate").translate(new HashMap<>()));
assertEquals(
fromString("asae"),
- fromString("translate").translate(ImmutableMap.of(
+ fromString("translate").translate(Map.of(
"r", "\0",
"n", "\0",
"l", "\0",
@@ -514,7 +513,7 @@ public void translate() {
)));
assertEquals(
fromString("aa世b"),
- fromString("花花世界").translate(ImmutableMap.of(
+ fromString("花花世界").translate(Map.of(
"花", "a",
"界", "b"
)));
diff --git a/common/unsafe/src/test/scala/org/apache/spark/unsafe/types/CollationFactorySuite.scala b/common/unsafe/src/test/scala/org/apache/spark/unsafe/types/CollationFactorySuite.scala
index 8e9d33efe7a6d..ddf588b6c64c7 100644
--- a/common/unsafe/src/test/scala/org/apache/spark/unsafe/types/CollationFactorySuite.scala
+++ b/common/unsafe/src/test/scala/org/apache/spark/unsafe/types/CollationFactorySuite.scala
@@ -17,7 +17,8 @@
package org.apache.spark.unsafe.types
-import scala.collection.parallel.immutable.ParSeq
+import java.util.stream.IntStream
+
import scala.jdk.CollectionConverters.MapHasAsScala
import com.ibm.icu.util.ULocale
@@ -139,7 +140,7 @@ class CollationFactorySuite extends AnyFunSuite with Matchers { // scalastyle:ig
case class CollationTestCase[R](collationName: String, s1: String, s2: String, expectedResult: R)
- test("collation aware equality and hash") {
+ test("collation aware equality and sort key") {
val checks = Seq(
CollationTestCase("UTF8_BINARY", "aaa", "aaa", true),
CollationTestCase("UTF8_BINARY", "aaa", "AAA", false),
@@ -194,9 +195,9 @@ class CollationFactorySuite extends AnyFunSuite with Matchers { // scalastyle:ig
assert(collation.equalsFunction(toUTF8(testCase.s1), toUTF8(testCase.s2)) ==
testCase.expectedResult)
- val hash1 = collation.hashFunction.applyAsLong(toUTF8(testCase.s1))
- val hash2 = collation.hashFunction.applyAsLong(toUTF8(testCase.s2))
- assert((hash1 == hash2) == testCase.expectedResult)
+ val sortKey1 = collation.sortKeyFunction.apply(toUTF8(testCase.s1)).asInstanceOf[Array[Byte]]
+ val sortKey2 = collation.sortKeyFunction.apply(toUTF8(testCase.s2)).asInstanceOf[Array[Byte]]
+ assert(sortKey1.sameElements(sortKey2) == testCase.expectedResult)
})
}
@@ -293,7 +294,7 @@ class CollationFactorySuite extends AnyFunSuite with Matchers { // scalastyle:ig
(0 to 10).foreach(_ => {
val collator = fetchCollation("UNICODE").getCollator
- ParSeq(0 to 100).foreach { _ =>
+ IntStream.rangeClosed(0, 100).parallel().forEach { _ =>
collator.getCollationKey("aaa")
}
})
diff --git a/common/utils-java/pom.xml b/common/utils-java/pom.xml
new file mode 100644
index 0000000000000..ba3603f810856
--- /dev/null
+++ b/common/utils-java/pom.xml
@@ -0,0 +1,84 @@
+
+
+
+
+ 4.0.0
+
+ org.apache.spark
+ spark-parent_2.13
+ 4.1.0-SNAPSHOT
+ ../../pom.xml
+
+
+ spark-common-utils-java_2.13
+ jar
+ Spark Project Common Java Utils
+ https://spark.apache.org/
+
+ common-utils-java
+
+
+
+
+ org.apache.spark
+ spark-tags_${scala.binary.version}
+
+
+ com.fasterxml.jackson.core
+ jackson-databind
+
+
+ org.slf4j
+ slf4j-api
+
+
+
+ org.slf4j
+ jul-to-slf4j
+
+
+ org.slf4j
+ jcl-over-slf4j
+
+
+ org.apache.logging.log4j
+ log4j-slf4j2-impl
+
+
+ org.apache.logging.log4j
+ log4j-api
+
+
+ org.apache.logging.log4j
+ log4j-core
+
+
+ org.apache.logging.log4j
+ log4j-1.2-api
+
+
+ org.apache.logging.log4j
+ log4j-layout-template-json
+
+
+
+ target/scala-${scala.binary.version}/classes
+ target/scala-${scala.binary.version}/test-classes
+
+
diff --git a/common/utils/src/main/java/org/apache/spark/QueryContext.java b/common/utils-java/src/main/java/org/apache/spark/QueryContext.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/QueryContext.java
rename to common/utils-java/src/main/java/org/apache/spark/QueryContext.java
diff --git a/common/utils/src/main/java/org/apache/spark/QueryContextType.java b/common/utils-java/src/main/java/org/apache/spark/QueryContextType.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/QueryContextType.java
rename to common/utils-java/src/main/java/org/apache/spark/QueryContextType.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/CoGroupFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/CoGroupFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/CoGroupFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/CoGroupFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/DoubleFlatMapFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/DoubleFlatMapFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/DoubleFlatMapFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/DoubleFlatMapFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/DoubleFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/DoubleFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/DoubleFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/DoubleFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/FilterFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/FilterFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/FilterFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/FilterFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/FlatMapFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/FlatMapFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/FlatMapFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/FlatMapFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/FlatMapFunction2.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/FlatMapFunction2.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/FlatMapFunction2.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/FlatMapFunction2.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/FlatMapGroupsFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/FlatMapGroupsFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/FlatMapGroupsFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/FlatMapGroupsFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/ForeachFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/ForeachFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/ForeachFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/ForeachFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/ForeachPartitionFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/ForeachPartitionFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/ForeachPartitionFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/ForeachPartitionFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/Function.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/Function.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/Function.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/Function.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/Function0.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/Function0.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/Function0.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/Function0.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/Function2.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/Function2.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/Function2.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/Function2.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/Function3.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/Function3.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/Function3.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/Function3.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/Function4.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/Function4.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/Function4.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/Function4.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/MapFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/MapFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/MapFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/MapFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/MapGroupsFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/MapGroupsFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/MapGroupsFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/MapGroupsFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/MapPartitionsFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/MapPartitionsFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/MapPartitionsFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/MapPartitionsFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/PairFlatMapFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/PairFlatMapFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/PairFlatMapFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/PairFlatMapFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/PairFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/PairFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/PairFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/PairFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/ReduceFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/ReduceFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/ReduceFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/ReduceFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/VoidFunction.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/VoidFunction.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/VoidFunction.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/VoidFunction.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/VoidFunction2.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/VoidFunction2.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/VoidFunction2.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/VoidFunction2.java
diff --git a/common/utils/src/main/java/org/apache/spark/api/java/function/package-info.java b/common/utils-java/src/main/java/org/apache/spark/api/java/function/package-info.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/api/java/function/package-info.java
rename to common/utils-java/src/main/java/org/apache/spark/api/java/function/package-info.java
diff --git a/common/utils-java/src/main/java/org/apache/spark/internal/LogKey.java b/common/utils-java/src/main/java/org/apache/spark/internal/LogKey.java
new file mode 100644
index 0000000000000..0bd0fecb43976
--- /dev/null
+++ b/common/utils-java/src/main/java/org/apache/spark/internal/LogKey.java
@@ -0,0 +1,52 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.internal;
+
+/**
+ * All structured logging `keys` used in `MDC` must extend `LogKey`
+ *
+ *
+ * `LogKey`s serve as identifiers for mapped diagnostic contexts (MDC) within logs.
+ * Follow these guidelines when adding a new LogKey:
+ *
+ *
+ * Define all structured logging keys in `LogKeys.java`, and sort them alphabetically for
+ * ease of search.
+ *
+ *
+ * Use `UPPER_SNAKE_CASE` for key names.
+ *
+ *
+ * Key names should be both simple and broad, yet include specific identifiers like `STAGE_ID`,
+ * `TASK_ID`, and `JOB_ID` when needed for clarity. For instance, use `MAX_ATTEMPTS` as a
+ * general key instead of creating separate keys for each scenario such as
+ * `EXECUTOR_STATE_SYNC_MAX_ATTEMPTS` and `MAX_TASK_FAILURES`.
+ * This balances simplicity with the detail needed for effective logging.
+ *
+ *
+ * Use abbreviations in names if they are widely understood,
+ * such as `APP_ID` for APPLICATION_ID, and `K8S` for KUBERNETES.
+ *
+ *
+ * For time-related keys, use milliseconds as the unit of time.
+ *
*
* Constant String Messages:
@@ -65,8 +66,10 @@
* you can define `custom LogKey` and use it in `java` code as follows:
*
*
- * // To add a `custom LogKey`, implement `LogKey`
- * public static class CUSTOM_LOG_KEY implements LogKey { }
+ * // To add custom log keys, define an enum that implements `LogKey`
+ * public enum CustomLogKeys implements LogKey {
+ * CUSTOM_LOG_KEY
+ * }
* import org.apache.spark.internal.MDC;
* logger.error("Unable to delete key {} for cache", MDC.of(CUSTOM_LOG_KEY, "key"));
*/
@@ -222,8 +225,8 @@ private void withLogContext(
for (int index = 0; index < mdcs.length; index++) {
MDC mdc = mdcs[index];
String value = (mdc.value() != null) ? mdc.value().toString() : null;
- if (Logging$.MODULE$.isStructuredLoggingEnabled()) {
- context.put(mdc.key().name(), value);
+ if (SparkLoggerFactory.isStructuredLoggingEnabled()) {
+ context.put(mdc.key().name().toLowerCase(Locale.ROOT), value);
}
args[index] = value;
}
diff --git a/common/utils/src/main/java/org/apache/spark/internal/SparkLoggerFactory.java b/common/utils-java/src/main/java/org/apache/spark/internal/SparkLoggerFactory.java
similarity index 77%
rename from common/utils/src/main/java/org/apache/spark/internal/SparkLoggerFactory.java
rename to common/utils-java/src/main/java/org/apache/spark/internal/SparkLoggerFactory.java
index a59c007362419..f5be570fa5b39 100644
--- a/common/utils/src/main/java/org/apache/spark/internal/SparkLoggerFactory.java
+++ b/common/utils-java/src/main/java/org/apache/spark/internal/SparkLoggerFactory.java
@@ -23,6 +23,20 @@
public class SparkLoggerFactory {
+ private static volatile boolean structuredLoggingEnabled = false;
+
+ public static void enableStructuredLogging() {
+ structuredLoggingEnabled = true;
+ }
+
+ public static void disableStructuredLogging() {
+ structuredLoggingEnabled = false;
+ }
+
+ public static boolean isStructuredLoggingEnabled() {
+ return structuredLoggingEnabled;
+ }
+
public static SparkLogger getLogger(String name) {
return new SparkLogger(LoggerFactory.getLogger(name));
}
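
To show how these pieces fit together, here is a hedged sketch combining a custom LogKey enum (per the guidelines above), the relocated SparkLoggerFactory toggle, and an MDC-tagged message; the class and key names are illustrative only, not part of the patch.

import org.apache.spark.internal.LogKey;
import org.apache.spark.internal.MDC;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;

// Hypothetical key, following the UPPER_SNAKE_CASE guideline from LogKey.java.
enum CustomLogKeys implements LogKey {
  CUSTOM_LOG_KEY
}

class StructuredLoggingSketch {
  private static final SparkLogger logger =
    SparkLoggerFactory.getLogger(StructuredLoggingSketch.class.getName());

  public static void main(String[] args) {
    // Once enabled, the MDC key name is emitted (lower-cased) in the structured log context.
    SparkLoggerFactory.enableStructuredLogging();
    logger.error("Unable to delete key {} for cache", MDC.of(CustomLogKeys.CUSTOM_LOG_KEY, "key"));
  }
}
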
diff --git a/common/utils/src/main/java/org/apache/spark/memory/MemoryMode.java b/common/utils-java/src/main/java/org/apache/spark/memory/MemoryMode.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/memory/MemoryMode.java
rename to common/utils-java/src/main/java/org/apache/spark/memory/MemoryMode.java
diff --git a/common/utils/src/main/java/org/apache/spark/network/util/ByteUnit.java b/common/utils-java/src/main/java/org/apache/spark/network/util/ByteUnit.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/network/util/ByteUnit.java
rename to common/utils-java/src/main/java/org/apache/spark/network/util/ByteUnit.java
diff --git a/common/utils/src/main/java/org/apache/spark/network/util/JavaUtils.java b/common/utils-java/src/main/java/org/apache/spark/network/util/JavaUtils.java
similarity index 55%
rename from common/utils/src/main/java/org/apache/spark/network/util/JavaUtils.java
rename to common/utils-java/src/main/java/org/apache/spark/network/util/JavaUtils.java
index 94f9f02ed2c9b..cf500926fa3aa 100644
--- a/common/utils/src/main/java/org/apache/spark/network/util/JavaUtils.java
+++ b/common/utils-java/src/main/java/org/apache/spark/network/util/JavaUtils.java
@@ -18,18 +18,26 @@
package org.apache.spark.network.util;
import java.io.*;
+import java.net.URL;
import java.nio.ByteBuffer;
import java.nio.channels.ReadableByteChannel;
import java.nio.charset.StandardCharsets;
+import java.nio.file.DirectoryStream;
import java.nio.file.Files;
import java.nio.file.LinkOption;
+import java.nio.file.Path;
+import java.nio.file.FileVisitOption;
+import java.nio.file.FileVisitResult;
+import java.nio.file.SimpleFileVisitor;
+import java.nio.file.StandardCopyOption;
import java.nio.file.attribute.BasicFileAttributes;
import java.util.*;
import java.util.concurrent.TimeUnit;
+import java.util.concurrent.atomic.AtomicLong;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
-
-import org.apache.commons.lang3.SystemUtils;
+import java.util.stream.Stream;
+import java.util.stream.Collectors;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -60,6 +68,109 @@ public static void closeQuietly(Closeable closeable) {
}
}
+ /** Delete a file or directory and its contents recursively without throwing exceptions. */
+ public static void deleteQuietly(File file) {
+ if (file != null && file.exists()) {
+ Path path = file.toPath();
+ try (Stream<Path> walk = Files.walk(path)) {
+ walk.sorted(Comparator.reverseOrder()).map(Path::toFile).forEach(File::delete);
+ } catch (Exception ignored) { /* No-op */ }
+ }
+ }
+
+ /** Registers the file or directory for deletion when the JVM exits. */
+ public static void forceDeleteOnExit(File file) throws IOException {
+ if (file != null && file.exists()) {
+ if (!file.isDirectory()) {
+ file.deleteOnExit();
+ } else {
+ Path path = file.toPath();
+ Files.walkFileTree(path, new SimpleFileVisitor<Path>() {
+ @Override
+ public FileVisitResult preVisitDirectory(Path p, BasicFileAttributes a)
+ throws IOException {
+ p.toFile().deleteOnExit();
+ return a.isSymbolicLink() ? FileVisitResult.SKIP_SUBTREE : FileVisitResult.CONTINUE;
+ }
+
+ @Override
+ public FileVisitResult visitFile(Path p, BasicFileAttributes a) throws IOException {
+ p.toFile().deleteOnExit();
+ return FileVisitResult.CONTINUE;
+ }
+ });
+ }
+ }
+ }
+
+ /** Move a file from src to dst. */
+ public static void moveFile(File src, File dst) throws IOException {
+ if (src == null || dst == null || !src.exists() || src.isDirectory() || dst.exists()) {
+ throw new IllegalArgumentException("Invalid input " + src + " or " + dst);
+ }
+ if (!src.renameTo(dst)) { // Try to use File.renameTo first
+ Files.move(src.toPath(), dst.toPath());
+ }
+ }
+
+ /** Move a directory from src to dst. */
+ public static void moveDirectory(File src, File dst) throws IOException {
+ if (src == null || dst == null || !src.exists() || !src.isDirectory() || dst.exists()) {
+ throw new IllegalArgumentException("Invalid input " + src + " or " + dst);
+ }
+ if (!src.renameTo(dst)) {
+ Path from = src.toPath().toAbsolutePath().normalize();
+ Path to = dst.toPath().toAbsolutePath().normalize();
+ if (to.startsWith(from)) {
+ throw new IllegalArgumentException("Cannot move directory to itself or its subdirectory");
+ }
+ moveDirectory(from, to);
+ }
+ }
+
+ private static void moveDirectory(Path src, Path dst) throws IOException {
+ Files.createDirectories(dst);
+ try (DirectoryStream<Path> stream = Files.newDirectoryStream(src)) {
+ for (Path from : stream) {
+ Path to = dst.resolve(from.getFileName());
+ if (Files.isDirectory(from)) {
+ moveDirectory(from, to);
+ } else {
+ Files.move(from, to, StandardCopyOption.REPLACE_EXISTING);
+ }
+ }
+ }
+ Files.delete(src);
+ }
+
+ /** Copy the src directory into the dst directory recursively. File attribute times are not copied. */
+ public static void copyDirectory(File src, File dst) throws IOException {
+ if (src == null || dst == null || !src.exists() || !src.isDirectory() ||
+ (dst.exists() && !dst.isDirectory())) {
+ throw new IllegalArgumentException("Invalid input file " + src + " or directory " + dst);
+ }
+ Path from = src.toPath().toAbsolutePath().normalize();
+ Path to = dst.toPath().toAbsolutePath().normalize();
+ if (to.startsWith(from)) {
+ throw new IllegalArgumentException("Cannot copy directory to itself or its subdirectory");
+ }
+ Files.createDirectories(to);
+ Files.walkFileTree(from, new SimpleFileVisitor<Path>() {
+ @Override
+ public FileVisitResult preVisitDirectory(Path dir, BasicFileAttributes attrs)
+ throws IOException {
+ Files.createDirectories(to.resolve(from.relativize(dir)));
+ return FileVisitResult.CONTINUE;
+ }
+
+ @Override
+ public FileVisitResult visitFile(Path file, BasicFileAttributes attrs) throws IOException {
+ Files.copy(file, to.resolve(from.relativize(file)), StandardCopyOption.REPLACE_EXISTING);
+ return FileVisitResult.CONTINUE;
+ }
+ });
+ }
+
/** Returns a hash consistent with Spark's Utils.nonNegativeHash(). */
public static int nonNegativeHash(Object obj) {
if (obj == null) { return 0; }
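
A brief, hedged usage sketch of the file helpers added in the hunk above; the paths are placeholders and error handling is omitted.

import java.io.File;
import java.io.IOException;
import org.apache.spark.network.util.JavaUtils;

// Sketch only: recursive copy (attribute times not preserved), then best-effort cleanup.
class JavaUtilsFileSketch {
  public static void main(String[] args) throws IOException {
    File src = new File("/tmp/spark-src-dir");   // placeholder path
    File dst = new File("/tmp/spark-dst-copy");  // placeholder path

    JavaUtils.copyDirectory(src, dst);  // rejects copying a directory into its own subtree
    JavaUtils.deleteQuietly(dst);       // swallows any exception during recursive delete
  }
}
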
@@ -83,6 +194,49 @@ public static String bytesToString(ByteBuffer b) {
return StandardCharsets.UTF_8.decode(b.slice()).toString();
}
+ public static long sizeOf(File file) throws IOException {
+ if (!file.exists()) {
+ throw new IllegalArgumentException(file.getAbsolutePath() + " not found");
+ }
+ return sizeOf(file.toPath());
+ }
+
+ public static long sizeOf(Path dirPath) throws IOException {
+ AtomicLong size = new AtomicLong(0);
+ Files.walkFileTree(dirPath, new SimpleFileVisitor<Path>() {
+ @Override
+ public FileVisitResult visitFile(Path file, BasicFileAttributes attrs) throws IOException {
+ size.addAndGet(attrs.size());
+ return FileVisitResult.CONTINUE;
+ }
+ });
+ return size.get();
+ }
+
+ public static void cleanDirectory(File dir) throws IOException {
+ if (dir == null || !dir.exists() || !dir.isDirectory()) {
+ throw new IllegalArgumentException("Invalid input directory " + dir);
+ }
+ cleanDirectory(dir.toPath());
+ }
+
+ private static void cleanDirectory(Path rootDir) throws IOException {
+ Files.walkFileTree(rootDir, new SimpleFileVisitor<Path>() {
+ @Override
+ public FileVisitResult visitFile(Path file, BasicFileAttributes attrs) throws IOException {
+ Files.delete(file);
+ return FileVisitResult.CONTINUE;
+ }
+
+ @Override
+ public FileVisitResult postVisitDirectory(Path dir, IOException e) throws IOException {
+ if (e != null) throw e;
+ if (!dir.equals(rootDir)) Files.delete(dir);
+ return FileVisitResult.CONTINUE;
+ }
+ });
+ }
+
/**
* Delete a file or directory and its contents recursively.
* Don't follow directories if they are symlinks.
@@ -110,14 +264,13 @@ public static void deleteRecursively(File file, FilenameFilter filter)
// On Unix systems, use operating system command to run faster
// If that does not work out, fallback to the Java IO way
// We exclude Apple Silicon test environment due to the limited resource issues.
- if (SystemUtils.IS_OS_UNIX && filter == null && !(SystemUtils.IS_OS_MAC_OSX &&
- (System.getenv("SPARK_TESTING") != null || System.getProperty("spark.testing") != null))) {
+ if (isUnix && filter == null && !(isMac && isTesting())) {
try {
deleteRecursivelyUsingUnixNative(file);
return;
} catch (IOException e) {
logger.warn("Attempt to delete using native Unix OS command failed for path = {}. " +
- "Falling back to Java IO way", e, MDC.of(LogKeys.PATH$.MODULE$, file.getAbsolutePath()));
+ "Falling back to Java IO way", e, MDC.of(LogKeys.PATH, file.getAbsolutePath()));
}
}
@@ -212,6 +365,25 @@ private static File[] listFilesSafely(File file, FilenameFilter filter) throws I
}
}
+ public static Set<Path> listPaths(File dir) throws IOException {
+ if (dir == null) throw new IllegalArgumentException("Input directory is null");
+ if (!dir.exists() || !dir.isDirectory()) return Collections.emptySet();
+ try (var stream = Files.walk(dir.toPath(), FileVisitOption.FOLLOW_LINKS)) {
+ return stream.filter(Files::isRegularFile).collect(Collectors.toCollection(HashSet::new));
+ }
+ }
+
+ public static Set<File> listFiles(File dir) throws IOException {
+ if (dir == null) throw new IllegalArgumentException("Input directory is null");
+ if (!dir.exists() || !dir.isDirectory()) return Collections.emptySet();
+ try (var stream = Files.walk(dir.toPath(), FileVisitOption.FOLLOW_LINKS)) {
+ return stream
+ .filter(Files::isRegularFile)
+ .map(Path::toFile)
+ .collect(Collectors.toCollection(HashSet::new));
+ }
+ }
+
private static final Map<String, TimeUnit> timeSuffixes;
private static final Map<String, ByteUnit> byteSuffixes;
@@ -415,7 +587,7 @@ public static File createDirectory(String root, String namePrefix) throws IOExce
dir = new File(root, namePrefix + "-" + UUID.randomUUID());
Files.createDirectories(dir.toPath());
} catch (IOException | SecurityException e) {
- logger.error("Failed to create directory {}", e, MDC.of(LogKeys.PATH$.MODULE$, dir));
+ logger.error("Failed to create directory {}", e, MDC.of(LogKeys.PATH, dir));
dir = null;
}
}
@@ -435,4 +607,154 @@ public static void readFully(ReadableByteChannel channel, ByteBuffer dst) throws
}
}
+ /**
+ * Read exactly {@code len} bytes from the input stream, otherwise throw an exception.
+ */
+ public static void readFully(InputStream in, byte[] arr, int off, int len) throws IOException {
+ if (in == null || len < 0 || (off < 0 || off > arr.length - len)) {
+ throw new IllegalArgumentException("Invalid input argument");
+ }
+ if (len != in.readNBytes(arr, off, len)) {
+ throw new EOFException("Failed to read " + len + " bytes.");
+ }
+ }
+
+ /**
+ * Copy the content of a URL into a file.
+ */
+ public static void copyURLToFile(URL url, File file) throws IOException {
+ if (url == null || file == null || (file.exists() && file.isDirectory())) {
+ throw new IllegalArgumentException("Invalid input " + url + " or " + file);
+ }
+ Files.createDirectories(file.getParentFile().toPath());
+ try (InputStream in = url.openStream()) {
+ Files.copy(in, file.toPath(), StandardCopyOption.REPLACE_EXISTING);
+ }
+ }
+
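+ /** Join the string forms of the elements with {@code sep}; null elements become empty strings and a null list yields an empty string. */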
+ public static String join(List<?> arr, String sep) {
+ if (arr == null) return "";
+ StringJoiner joiner = new StringJoiner(sep == null ? "" : sep);
+ for (Object a : arr) {
+ joiner.add(a == null ? "" : a.toString());
+ }
+ return joiner.toString();
+ }
+
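+ /** Render the stack trace of {@code t} as a UTF-8 string; returns an empty string if {@code t} is null. */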
+ public static String stackTraceToString(Throwable t) {
+ if (t == null) {
+ return "";
+ }
+
+ ByteArrayOutputStream out = new ByteArrayOutputStream();
+ try (PrintWriter writer = new PrintWriter(out)) {
+ t.printStackTrace(writer);
+ writer.flush();
+ }
+ return out.toString(StandardCharsets.UTF_8);
+ }
+
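+ /** Cast a long value to an int, throwing an IllegalArgumentException if it is outside the int range. */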
+ public static int checkedCast(long value) {
+ if (value > Integer.MAX_VALUE || value < Integer.MIN_VALUE) {
+ throw new IllegalArgumentException("Cannot cast to integer.");
+ }
+ return (int) value;
+ }
+
+ /** Return true if the contents of the two files are equal, or if neither file exists. */
+ public static boolean contentEquals(File file1, File file2) throws IOException {
+ if (file1 == null && file2 != null || file1 != null && file2 == null) {
+ return false;
+ } else if (file1 == null && file2 == null || !file1.exists() && !file2.exists()) {
+ return true;
+ } else if (!file1.exists() || !file2.exists()) {
+ return false;
+ } else if (file1.isDirectory() || file2.isDirectory()) {
+ throw new IllegalArgumentException("Input is not a file: %s or %s".formatted(file1, file2));
+ } else if (file1.length() != file2.length()) {
+ return false;
+ } else {
+ Path path1 = file1.toPath();
+ Path path2 = file2.toPath();
+ return Files.isSameFile(path1, path2) || Files.mismatch(path1, path2) == -1L;
+ }
+ }
+
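+ /** Read all remaining bytes from {@code in} and decode them as a UTF-8 string. */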
+ public static String toString(InputStream in) throws IOException {
+ return new String(in.readAllBytes(), StandardCharsets.UTF_8);
+ }
+
+ /**
+ * Indicates whether Spark is currently running unit tests.
+ */
+ public static boolean isTesting() {
+ return System.getenv("SPARK_TESTING") != null || System.getProperty("spark.testing") != null;
+ }
+
+ /**
+ * The `os.name` system property.
+ */
+ public static String osName = System.getProperty("os.name");
+
+ /**
+ * The `os.version` system property.
+ */
+ public static String osVersion = System.getProperty("os.version");
+
+ /**
+ * The Java runtime version, as reported by {@code Runtime.version()}.
+ */
+ public static String javaVersion = Runtime.version().toString();
+
+ /**
+ * The `os.arch` system property.
+ */
+ public static String osArch = System.getProperty("os.arch");
+
+ /**
+ * Whether the underlying operating system is Windows.
+ */
+ public static boolean isWindows = osName.regionMatches(true, 0, "Windows", 0, 7);
+
+ /**
+ * Whether the underlying operating system is Mac OS X.
+ */
+ public static boolean isMac = osName.regionMatches(true, 0, "Mac OS X", 0, 8);
+
+ /**
+ * Whether the underlying operating system is Mac OS X and processor is Apple Silicon.
+ */
+ public static boolean isMacOnAppleSilicon = isMac && osArch.equals("aarch64");
+
+ /**
+ * Whether the underlying operating system is Linux.
+ */
+ public static boolean isLinux = osName.regionMatches(true, 0, "Linux", 0, 5);
+
+ /**
+ * Whether the underlying operating system is UNIX.
+ */
+ public static boolean isUnix = Stream.of("AIX", "HP-UX", "Irix", "Linux", "Mac OS X", "Solaris",
+ "SunOS", "FreeBSD", "OpenBSD", "NetBSD")
+ .anyMatch(prefix -> osName.regionMatches(true, 0, prefix, 0, prefix.length()));
+
+ /**
+ * Throws IllegalArgumentException with the given message if the check is false.
+ * Keep this clone of CommandBuilderUtils.checkArgument synced with the original.
+ */
+ public static void checkArgument(boolean check, String msg, Object... args) {
+ if (!check) {
+ throw new IllegalArgumentException(String.format(msg, args));
+ }
+ }
+
+ /**
+ * Throws IllegalStateException with the given message if the check is false.
+ * Keep this clone of CommandBuilderUtils.checkState synced with the original.
+ */
+ public static void checkState(boolean check, String msg, Object... args) {
+ if (!check) {
+ throw new IllegalStateException(String.format(msg, args));
+ }
+ }
}
diff --git a/common/utils/src/main/java/org/apache/spark/unsafe/array/ByteArrayUtils.java b/common/utils-java/src/main/java/org/apache/spark/unsafe/array/ByteArrayUtils.java
similarity index 100%
rename from common/utils/src/main/java/org/apache/spark/unsafe/array/ByteArrayUtils.java
rename to common/utils-java/src/main/java/org/apache/spark/unsafe/array/ByteArrayUtils.java
diff --git a/common/utils-java/src/main/java/org/apache/spark/util/Pair.java b/common/utils-java/src/main/java/org/apache/spark/util/Pair.java
new file mode 100644
index 0000000000000..bdcc01b49dcf4
--- /dev/null
+++ b/common/utils-java/src/main/java/org/apache/spark/util/Pair.java
@@ -0,0 +1,29 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.util;
+
+/**
+ * An immutable pair of values. Note that the accessors are intentionally named `getLeft` and
+ * `getRight` instead of `left` and `right` in order to mitigate the migration burden
+ * from `org.apache.commons.lang3.tuple.Pair`.
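+ * For example, {@code Pair.of("a", 1).getLeft()} returns {@code "a"}.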
+ */
+public record Pair<L, R>(L getLeft, R getRight) {
+ public static <L, R> Pair<L, R> of(L left, R right) {
+ return new Pair<>(left, right);
+ }
+}
diff --git a/common/utils/src/main/resources/org/apache/spark/SparkLayout.json b/common/utils-java/src/main/resources/org/apache/spark/SparkLayout.json
similarity index 100%
rename from common/utils/src/main/resources/org/apache/spark/SparkLayout.json
rename to common/utils-java/src/main/resources/org/apache/spark/SparkLayout.json
diff --git a/common/utils/src/main/resources/org/apache/spark/log4j2-defaults.properties b/common/utils-java/src/main/resources/org/apache/spark/log4j2-defaults.properties
similarity index 100%
rename from common/utils/src/main/resources/org/apache/spark/log4j2-defaults.properties
rename to common/utils-java/src/main/resources/org/apache/spark/log4j2-defaults.properties
diff --git a/common/utils/src/main/resources/org/apache/spark/log4j2-json-layout.properties b/common/utils-java/src/main/resources/org/apache/spark/log4j2-json-layout.properties
similarity index 100%
rename from common/utils/src/main/resources/org/apache/spark/log4j2-json-layout.properties
rename to common/utils-java/src/main/resources/org/apache/spark/log4j2-json-layout.properties
diff --git a/connect-examples/server-library-example/common/src/main/protobuf/base.proto b/common/utils-java/src/test/java/org/apache/spark/util/CustomLogKeys.java
similarity index 75%
rename from connect-examples/server-library-example/common/src/main/protobuf/base.proto
rename to common/utils-java/src/test/java/org/apache/spark/util/CustomLogKeys.java
index 9d902a587ed37..cadacba7c5175 100644
--- a/connect-examples/server-library-example/common/src/main/protobuf/base.proto
+++ b/common/utils-java/src/test/java/org/apache/spark/util/CustomLogKeys.java
@@ -15,14 +15,10 @@
* limitations under the License.
*/
-syntax = 'proto3';
+package org.apache.spark.util;
-option java_multiple_files = true;
-option java_package = "org.apache.connect.examples.serverlibrary.proto";
+import org.apache.spark.internal.LogKey;
-message CustomTable {
- // Path to the custom table.
- string path = 1;
- // Name of the custom table.
- string name = 2;
+public enum CustomLogKeys implements LogKey {
+ CUSTOM_LOG_KEY
}
diff --git a/common/utils/src/test/java/org/apache/spark/util/PatternSparkLoggerSuite.java b/common/utils-java/src/test/java/org/apache/spark/util/PatternSparkLoggerSuite.java
similarity index 90%
rename from common/utils/src/test/java/org/apache/spark/util/PatternSparkLoggerSuite.java
rename to common/utils-java/src/test/java/org/apache/spark/util/PatternSparkLoggerSuite.java
index 6bfe595def1d4..7f8f3f93a8d46 100644
--- a/common/utils/src/test/java/org/apache/spark/util/PatternSparkLoggerSuite.java
+++ b/common/utils-java/src/test/java/org/apache/spark/util/PatternSparkLoggerSuite.java
@@ -90,12 +90,7 @@ String expectedPatternForMsgWithMDCValueIsNull(Level level) {
}
@Override
- String expectedPatternForScalaCustomLogKey(Level level) {
- return toRegexPattern(level, ".*: Scala custom log message.\n");
- }
-
- @Override
- String expectedPatternForJavaCustomLogKey(Level level) {
- return toRegexPattern(level, ".*: Java custom log message.\n");
+ String expectedPatternForCustomLogKey(Level level) {
+ return toRegexPattern(level, ".*: Custom log message.\n");
}
}
diff --git a/common/utils/src/test/java/org/apache/spark/util/SparkLoggerSuiteBase.java b/common/utils-java/src/test/java/org/apache/spark/util/SparkLoggerSuiteBase.java
similarity index 83%
rename from common/utils/src/test/java/org/apache/spark/util/SparkLoggerSuiteBase.java
rename to common/utils-java/src/test/java/org/apache/spark/util/SparkLoggerSuiteBase.java
index 186088ede1d0b..d86fe12c89243 100644
--- a/common/utils/src/test/java/org/apache/spark/util/SparkLoggerSuiteBase.java
+++ b/common/utils-java/src/test/java/org/apache/spark/util/SparkLoggerSuiteBase.java
@@ -22,11 +22,9 @@
import java.nio.file.Files;
import java.util.List;
-import org.apache.commons.lang3.tuple.Pair;
import org.apache.logging.log4j.Level;
import org.junit.jupiter.api.Test;
-import org.apache.spark.internal.LogKey;
import org.apache.spark.internal.LogKeys;
import org.apache.spark.internal.MDC;
import org.apache.spark.internal.SparkLogger;
@@ -73,23 +71,20 @@ private void checkLogOutput(Level level, Runnable func, ExpectedResult result) {
private final String basicMsgWithEscapeChar =
"This is a log message\nThis is a new line \t other msg";
- private final MDC executorIDMDC = MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, "1");
+ private final MDC executorIDMDC = MDC.of(LogKeys.EXECUTOR_ID, "1");
private final String msgWithMDC = "Lost executor {}.";
private final MDC[] mdcs = new MDC[] {
- MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, "1"),
- MDC.of(LogKeys.REASON$.MODULE$, "the shuffle data is too large")};
+ MDC.of(LogKeys.EXECUTOR_ID, "1"),
+ MDC.of(LogKeys.REASON, "the shuffle data is too large")};
private final String msgWithMDCs = "Lost executor {}, reason: {}";
private final MDC[] emptyMDCs = new MDC[0];
- private final MDC executorIDMDCValueIsNull = MDC.of(LogKeys.EXECUTOR_ID$.MODULE$, null);
+ private final MDC executorIDMDCValueIsNull = MDC.of(LogKeys.EXECUTOR_ID, null);
- private final MDC scalaCustomLogMDC =
- MDC.of(CustomLogKeys.CUSTOM_LOG_KEY$.MODULE$, "Scala custom log message.");
-
- private final MDC javaCustomLogMDC =
- MDC.of(JavaCustomLogKeys.CUSTOM_LOG_KEY, "Java custom log message.");
+ private final MDC customLogMDC =
+ MDC.of(CustomLogKeys.CUSTOM_LOG_KEY, "Custom log message.");
// test for basic message (without any mdc)
abstract String expectedPatternForBasicMsg(Level level);
@@ -118,10 +113,7 @@ String expectedPatternForMsgWithEmptyMDCsAndException(Level level) {
abstract String expectedPatternForMsgWithMDCValueIsNull(Level level);
// test for scala custom LogKey
- abstract String expectedPatternForScalaCustomLogKey(Level level);
-
- // test for java custom LogKey
- abstract String expectedPatternForJavaCustomLogKey(Level level);
+ abstract String expectedPatternForCustomLogKey(Level level);
@Test
public void testBasicMsg() {
@@ -241,34 +233,14 @@ public void testLoggerWithMDCValueIsNull() {
}
@Test
- public void testLoggerWithScalaCustomLogKey() {
- Runnable errorFn = () -> logger().error("{}", scalaCustomLogMDC);
- Runnable warnFn = () -> logger().warn("{}", scalaCustomLogMDC);
- Runnable infoFn = () -> logger().info("{}", scalaCustomLogMDC);
- List.of(
- Pair.of(Level.ERROR, errorFn),
- Pair.of(Level.WARN, warnFn),
- Pair.of(Level.INFO, infoFn)).forEach(pair ->
- checkLogOutput(pair.getLeft(), pair.getRight(), this::expectedPatternForScalaCustomLogKey));
- }
-
- @Test
- public void testLoggerWithJavaCustomLogKey() {
- Runnable errorFn = () -> logger().error("{}", javaCustomLogMDC);
- Runnable warnFn = () -> logger().warn("{}", javaCustomLogMDC);
- Runnable infoFn = () -> logger().info("{}", javaCustomLogMDC);
+ public void testLoggerWithCustomLogKey() {
+ Runnable errorFn = () -> logger().error("{}", customLogMDC);
+ Runnable warnFn = () -> logger().warn("{}", customLogMDC);
+ Runnable infoFn = () -> logger().info("{}", customLogMDC);
List.of(
Pair.of(Level.ERROR, errorFn),
Pair.of(Level.WARN, warnFn),
Pair.of(Level.INFO, infoFn)).forEach(pair ->
- checkLogOutput(pair.getLeft(), pair.getRight(), this::expectedPatternForJavaCustomLogKey));
+ checkLogOutput(pair.getLeft(), pair.getRight(), this::expectedPatternForCustomLogKey));
}
}
-
-class JavaCustomLogKeys {
- // Custom `LogKey` must be `implements LogKey`
- public static class CUSTOM_LOG_KEY implements LogKey { }
-
- // Singleton
- public static final CUSTOM_LOG_KEY CUSTOM_LOG_KEY = new CUSTOM_LOG_KEY();
-}
diff --git a/common/utils/src/test/java/org/apache/spark/util/StructuredSparkLoggerSuite.java b/common/utils-java/src/test/java/org/apache/spark/util/StructuredSparkLoggerSuite.java
similarity index 88%
rename from common/utils/src/test/java/org/apache/spark/util/StructuredSparkLoggerSuite.java
rename to common/utils-java/src/test/java/org/apache/spark/util/StructuredSparkLoggerSuite.java
index 1fab167adfeb0..88ac8ea34710a 100644
--- a/common/utils/src/test/java/org/apache/spark/util/StructuredSparkLoggerSuite.java
+++ b/common/utils-java/src/test/java/org/apache/spark/util/StructuredSparkLoggerSuite.java
@@ -24,7 +24,6 @@
import org.junit.jupiter.api.AfterAll;
import org.junit.jupiter.api.BeforeAll;
-import org.apache.spark.internal.Logging$;
import org.apache.spark.internal.SparkLogger;
import org.apache.spark.internal.SparkLoggerFactory;
@@ -33,13 +32,13 @@ public class StructuredSparkLoggerSuite extends SparkLoggerSuiteBase {
// Enable Structured Logging before running the tests
@BeforeAll
public static void setup() {
- Logging$.MODULE$.enableStructuredLogging();
+ SparkLoggerFactory.enableStructuredLogging();
}
// Disable Structured Logging after running the tests
@AfterAll
public static void teardown() {
- Logging$.MODULE$.disableStructuredLogging();
+ SparkLoggerFactory.disableStructuredLogging();
}
private static final SparkLogger LOGGER =
@@ -176,28 +175,14 @@ String expectedPatternForMsgWithMDCValueIsNull(Level level) {
}
@Override
- String expectedPatternForScalaCustomLogKey(Level level) {
+ String expectedPatternForCustomLogKey(Level level) {
return compactAndToRegexPattern(level, """
{
"ts": "",
"level": "",
- "msg": "Scala custom log message.",
+ "msg": "Custom log message.",
"context": {
- "custom_log_key": "Scala custom log message."
- },
- "logger": ""
- }""");
- }
-
- @Override
- String expectedPatternForJavaCustomLogKey(Level level) {
- return compactAndToRegexPattern(level, """
- {
- "ts": "",
- "level": "",
- "msg": "Java custom log message.",
- "context": {
- "custom_log_key": "Java custom log message."
+ "custom_log_key": "Custom log message."
},
"logger": ""
}""");
diff --git a/common/utils-java/src/test/resources/log4j2.properties b/common/utils-java/src/test/resources/log4j2.properties
new file mode 100644
index 0000000000000..cb38f5b55a0ba
--- /dev/null
+++ b/common/utils-java/src/test/resources/log4j2.properties
@@ -0,0 +1,60 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+rootLogger.level = info
+rootLogger.appenderRef.file.ref = ${sys:test.appender:-File}
+
+appender.file.type = File
+appender.file.name = File
+appender.file.fileName = target/unit-tests.log
+appender.file.layout.type = JsonTemplateLayout
+appender.file.layout.eventTemplateUri = classpath:org/apache/spark/SparkLayout.json
+
+# Structured Logging Appender
+appender.structured.type = File
+appender.structured.name = structured
+appender.structured.fileName = target/structured.log
+appender.structured.layout.type = JsonTemplateLayout
+appender.structured.layout.eventTemplateUri = classpath:org/apache/spark/SparkLayout.json
+
+# Pattern Logging Appender
+appender.pattern.type = File
+appender.pattern.name = pattern
+appender.pattern.fileName = target/pattern.log
+appender.pattern.layout.type = PatternLayout
+appender.pattern.layout.pattern = %d{yy/MM/dd HH:mm:ss} %p %c{1}: %m%n%ex
+
+# Custom loggers
+logger.structured_logging.name = org.apache.spark.util.StructuredLoggingSuite
+logger.structured_logging.level = trace
+logger.structured_logging.appenderRefs = structured
+logger.structured_logging.appenderRef.structured.ref = structured
+
+logger.pattern_logging.name = org.apache.spark.util.PatternLoggingSuite
+logger.pattern_logging.level = trace
+logger.pattern_logging.appenderRefs = pattern
+logger.pattern_logging.appenderRef.pattern.ref = pattern
+
+logger.structured_logger.name = org.apache.spark.util.StructuredSparkLoggerSuite
+logger.structured_logger.level = trace
+logger.structured_logger.appenderRefs = structured
+logger.structured_logger.appenderRef.structured.ref = structured
+
+logger.pattern_logger.name = org.apache.spark.util.PatternSparkLoggerSuite
+logger.pattern_logger.level = trace
+logger.pattern_logger.appenderRefs = pattern
+logger.pattern_logger.appenderRef.pattern.ref = pattern
diff --git a/common/utils/pom.xml b/common/utils/pom.xml
index 44771938439ae..df3bc5adb10bd 100644
--- a/common/utils/pom.xml
+++ b/common/utils/pom.xml
@@ -39,6 +39,18 @@
      <groupId>org.apache.spark</groupId>
      <artifactId>spark-tags_${scala.binary.version}</artifactId>
    </dependency>
+    <dependency>
+      <groupId>org.apache.spark</groupId>
+      <artifactId>spark-common-utils-java_${scala.binary.version}</artifactId>
+      <version>${project.version}</version>
+    </dependency>
+    <dependency>
+      <groupId>org.apache.spark</groupId>
+      <artifactId>spark-common-utils-java_${scala.binary.version}</artifactId>
+      <version>${project.version}</version>
+      <type>test-jar</type>
+      <scope>test</scope>
+    </dependency>
    <dependency>
      <groupId>org.apache.xbean</groupId>
      <artifactId>xbean-asm9-shaded</artifactId>
@@ -51,14 +63,6 @@
      <groupId>com.fasterxml.jackson.module</groupId>
      <artifactId>jackson-module-scala_${scala.binary.version}</artifactId>
    </dependency>
-    <dependency>
-      <groupId>org.apache.commons</groupId>
-      <artifactId>commons-text</artifactId>
-    </dependency>
-    <dependency>
-      <groupId>commons-io</groupId>
-      <artifactId>commons-io</artifactId>
-    </dependency>
    <dependency>
      <groupId>org.apache.ivy</groupId>
      <artifactId>ivy</artifactId>
diff --git a/common/utils/src/main/resources/error/error-conditions.json b/common/utils/src/main/resources/error/error-conditions.json
index fe14f4e827938..167c460536ac9 100644
--- a/common/utils/src/main/resources/error/error-conditions.json
+++ b/common/utils/src/main/resources/error/error-conditions.json
@@ -90,6 +90,30 @@
],
"sqlState" : "42000"
},
+ "APPROX_TOP_K_MAX_ITEMS_TRACKED_EXCEEDS_LIMIT" : {
+ "message" : [
+ "The max items tracked `maxItemsTracked`() of `approx_top_k` should be less than or equal to ."
+ ],
+ "sqlState" : "22023"
+ },
+ "APPROX_TOP_K_MAX_ITEMS_TRACKED_LESS_THAN_K" : {
+ "message" : [
+ "The max items tracked `maxItemsTracked`() of `approx_top_k` should be greater than or equal to `k`()."
+ ],
+ "sqlState" : "22023"
+ },
+ "APPROX_TOP_K_NON_POSITIVE_ARG" : {
+ "message" : [
+ "The value of in `approx_top_k` must be a positive integer, but got ."
+ ],
+ "sqlState" : "22023"
+ },
+ "APPROX_TOP_K_NULL_ARG" : {
+ "message" : [
+ "The value of in `approx_top_k` cannot be NULL."
+ ],
+ "sqlState" : "22004"
+ },
"ARITHMETIC_OVERFLOW" : {
"message" : [
". If necessary set to \"false\" to bypass this error."
@@ -249,6 +273,24 @@
],
"sqlState" : "0A000"
},
+ "CANNOT_LOAD_CHECKPOINT_FILE_MANAGER" : {
+ "message" : [
+ "Error loading streaming checkpoint file manager for path=."
+ ],
+ "subClass" : {
+ "ERROR_LOADING_CLASS" : {
+ "message" : [
+ "Error instantiating streaming checkpoint file manager for path= with className=. msg=."
+ ]
+ },
+ "UNCATEGORIZED" : {
+ "message" : [
+ ""
+ ]
+ }
+ },
+ "sqlState" : "58030"
+ },
"CANNOT_LOAD_FUNCTION_CLASS" : {
"message" : [
"Cannot load class when registering the function , please make sure it is on the classpath."
@@ -853,6 +895,11 @@
"Please fit or load a model smaller than bytes."
]
},
+ "MODEL_SUMMARY_LOST" : {
+ "message" : [
+ "The model summary is lost because the cached model is offloaded."
+ ]
+ },
"UNSUPPORTED_EXCEPTION" : {
"message" : [
""
@@ -921,12 +968,24 @@
},
"sqlState" : "21S01"
},
+ "CYCLIC_FUNCTION_REFERENCE" : {
+ "message" : [
+ "Cyclic function reference detected: ."
+ ],
+ "sqlState" : "42887"
+ },
"DATAFLOW_GRAPH_NOT_FOUND" : {
"message" : [
"Dataflow graph with id could not be found"
],
"sqlState" : "KD011"
},
+ "DATATYPE_CANNOT_ORDER" : {
+ "message" : [
+ "Type does not support ordered operations."
+ ],
+ "sqlState" : "0A000"
+ },
"DATATYPE_MISMATCH" : {
"message" : [
"Cannot resolve due to data type mismatch:"
@@ -1435,6 +1494,12 @@
],
"sqlState" : "42711"
},
+ "DUPLICATE_VARIABLE_NAME_INSIDE_DECLARE" : {
+ "message" : [
+ "Found duplicate variable in the declare variable list. Please, remove one of them."
+ ],
+ "sqlState" : "42734"
+ },
"EMITTING_ROWS_OLDER_THAN_WATERMARK_NOT_ALLOWED" : {
"message" : [
"Previous node emitted a row with eventTime= which is older than current_watermark_value=",
@@ -1781,12 +1846,6 @@
],
"sqlState" : "39000"
},
- "FOUND_MULTIPLE_DATA_SOURCES" : {
- "message" : [
- "Detected multiple data sources with the name ''. Please check the data source isn't simultaneously registered and located in the classpath."
- ],
- "sqlState" : "42710"
- },
"GENERATED_COLUMN_WITH_DEFAULT_VALUE" : {
"message" : [
"A column cannot have both a default value and a generation expression but column has default value: () and generation expression: ()."
@@ -2708,6 +2767,34 @@
],
"sqlState" : "42000"
},
+ "INVALID_FLOW_QUERY_TYPE" : {
+ "message" : [
+ "Flow returns an invalid relation type."
+ ],
+ "subClass" : {
+ "BATCH_RELATION_FOR_STREAMING_TABLE" : {
+ "message" : [
+ "Streaming tables may only be defined by streaming relations, but the flow attempts to write a batch relation to the streaming table . Consider using the STREAM operator in Spark-SQL to convert the batch relation into a streaming relation, or populating the streaming table with an append once-flow instead."
+ ]
+ },
+ "STREAMING_RELATION_FOR_MATERIALIZED_VIEW" : {
+ "message" : [
+ "Materialized views may only be defined by a batch relation, but the flow attempts to write a streaming relation to the materialized view ."
+ ]
+ },
+ "STREAMING_RELATION_FOR_ONCE_FLOW" : {
+ "message" : [
+ " is an append once-flow that is defined by a streaming relation. Append once-flows may only be defined by or return a batch relation."
+ ]
+ },
+ "STREAMING_RELATION_FOR_PERSISTED_VIEW" : {
+ "message" : [
+ "Persisted views may only be defined by a batch relation, but the flow attempts to write a streaming relation to the persisted view ."
+ ]
+ }
+ },
+ "sqlState" : "42000"
+ },
"INVALID_FORMAT" : {
"message" : [
"The format is invalid: ."
@@ -3349,6 +3436,11 @@
"expects a string literal, but got ."
]
},
+ "TIME_UNIT" : {
+ "message" : [
+ "expects one of the units 'HOUR', 'MINUTE', 'SECOND', 'MILLISECOND', 'MICROSECOND', but got ''."
+ ]
+ },
"ZERO_INDEX" : {
"message" : [
"expects %1$, %2$ and so on, but got %0$."
@@ -3407,7 +3499,7 @@
},
"INVALID_RECURSIVE_CTE" : {
"message" : [
- "Invalid recursive definition found. Recursive queries must contain an UNION or an UNION ALL statement with 2 children. The first child needs to be the anchor term without any recursive references."
+ "Invalid recursive definition found. Recursive queries must contain an UNION or an UNION ALL statement with 2 children. The first child needs to be the anchor term without any recursive references. Any top level inner CTE must not contain self references."
],
"sqlState" : "42836"
},
@@ -3416,14 +3508,9 @@
"Invalid recursive reference found inside WITH RECURSIVE clause."
],
"subClass" : {
- "NUMBER" : {
- "message" : [
- "Multiple self-references to one recursive CTE are not allowed."
- ]
- },
"PLACE" : {
"message" : [
- "Recursive references cannot be used on the right side of left outer/semi/anti joins, on the left side of right outer joins, in full outer joins, in aggregates, and in subquery expressions."
+ "Recursive references cannot be used on the right side of left outer/semi/anti joins, on the left side of right outer joins, in full outer joins, in aggregates, window functions or sorts"
]
}
},
@@ -3551,6 +3638,12 @@
],
"sqlState" : "42K08"
},
+ "INVALID_SQL_FUNCTION_DATA_ACCESS" : {
+ "message" : [
+ "Cannot create a SQL function with CONTAINS SQL that accesses a table/view or a SQL function that reads SQL data. Please use READS SQL DATA instead."
+ ],
+ "sqlState" : "42K0E"
+ },
"INVALID_SQL_FUNCTION_PLAN_STRUCTURE" : {
"message" : [
"Invalid SQL function plan structure",
@@ -3975,18 +4068,25 @@
],
"sqlState" : "42K0L"
},
- "LABEL_ALREADY_EXISTS" : {
+ "LABEL_OR_FOR_VARIABLE_ALREADY_EXISTS" : {
"message" : [
- "The label org.objenesisobjenesis
- 3.3
+ 3.4com.github.jnr
@@ -666,7 +665,7 @@
org.apache.commonscommons-text
- 1.13.1
+ 1.14.0commons-lang
@@ -874,7 +873,7 @@
com.github.lubenzstd-jni
- 1.5.7-3
+ 1.5.7-4com.clearspring.analytics
@@ -1152,6 +1151,10 @@
org.apache.commonscommons-math3
+
+ org.scala-lang.modules
+ scala-collection-compat_${scala.binary.version}
+
@@ -1240,13 +1243,13 @@
net.bytebuddybyte-buddy
- 1.17.0
+ 1.17.6testnet.bytebuddybyte-buddy-agent
- 1.17.0
+ 1.17.6test
@@ -1623,19 +1626,6 @@
-
-
- org.codehaus.jackson
- jackson-core-asl
- ${codehaus.jackson.version}
- ${hive.jackson.scope}
-
-
- org.codehaus.jackson
- jackson-mapper-asl
- ${codehaus.jackson.version}
- ${hive.jackson.scope}
- ${hive.group}hive-beeline
@@ -2320,7 +2310,7 @@
org.apache.orcorc-format
- 1.1.0
+ 1.1.1${orc.classifier}${orc.deps.scope}
@@ -2463,11 +2453,6 @@
joda-time${joda.version}
-
- org.jodd
- jodd-core
- ${jodd.version}
- org.datanucleusdatanucleus-core
@@ -2631,7 +2616,7 @@
org.apache.maven.pluginsmaven-enforcer-plugin
- 3.5.0
+ 3.6.0enforce-versions
@@ -2685,14 +2670,14 @@
org.codehaus.mojoextra-enforcer-rules
- 1.9.0
+ 1.10.0org.codehaus.mojobuild-helper-maven-plugin
- 3.6.0
+ 3.6.1module-timestamp-property
@@ -2808,6 +2793,7 @@
--release${java.version}-Xlint:all,-serial,-path,-try
+ -proc:full
@@ -2829,7 +2815,7 @@
org.apache.maven.pluginsmaven-surefire-plugin
- 3.5.2
+ 3.5.3
@@ -2967,7 +2953,7 @@
org.apache.maven.pluginsmaven-clean-plugin
- 3.4.1
+ 3.5.0
diff --git a/project/MimaExcludes.scala b/project/MimaExcludes.scala
index 5f1c0cbca0d0b..57ab8e196da91 100644
--- a/project/MimaExcludes.scala
+++ b/project/MimaExcludes.scala
@@ -39,7 +39,10 @@ object MimaExcludes {
ProblemFilters.exclude[ReversedMissingMethodProblem]("org.apache.spark.ml.linalg.Vector.getSizeInBytes"),
// [SPARK-52221][SQL] Refactor SqlScriptingLocalVariableManager into more generic context manager
- ProblemFilters.exclude[DirectMissingMethodProblem]("org.apache.spark.sql.scripting.SqlScriptingExecution.withLocalVariableManager")
+ ProblemFilters.exclude[DirectMissingMethodProblem]("org.apache.spark.sql.scripting.SqlScriptingExecution.withLocalVariableManager"),
+
+ // [SPARK-53391][CORE] Remove unused PrimitiveKeyOpenHashMap
+ ProblemFilters.exclude[MissingClassProblem]("org.apache.spark.util.collection.PrimitiveKeyOpenHashMap*")
)
// Default exclude rules
@@ -83,6 +86,13 @@ object MimaExcludes {
// SPARK-51267: Match local Spark Connect server logic between Python and Scala
ProblemFilters.exclude[MissingFieldProblem]("org.apache.spark.launcher.SparkLauncher.SPARK_LOCAL_REMOTE"),
+ // SPARK-53138: Split common/utils Java code into a new module common/utils-java
+ ProblemFilters.exclude[MissingClassProblem]("org.apache.spark.QueryContext"),
+ ProblemFilters.exclude[MissingClassProblem]("org.apache.spark.QueryContextType"),
+ ProblemFilters.exclude[MissingClassProblem]("org.apache.spark.api.java.function.*"),
+ ProblemFilters.exclude[MissingClassProblem]("org.apache.spark.network.util.ByteUnit"),
+ ProblemFilters.exclude[MissingClassProblem]("org.apache.spark.network.util.JavaUtils"),
+
(problem: Problem) => problem match {
case MissingClassProblem(cls) => !cls.fullName.startsWith("org.sparkproject.jpmml") &&
!cls.fullName.startsWith("org.sparkproject.dmg.pmml")
diff --git a/project/SparkBuild.scala b/project/SparkBuild.scala
index 77001e6bdf227..b1bbdad17759b 100644
--- a/project/SparkBuild.scala
+++ b/project/SparkBuild.scala
@@ -16,6 +16,7 @@
*/
import java.io._
+import java.lang.{Runtime => JRuntime}
import java.nio.charset.StandardCharsets.UTF_8
import java.nio.file.{Files, Paths, StandardCopyOption}
import java.util.Locale
@@ -58,10 +59,10 @@ object BuildCommons {
val allProjects@Seq(
core, graphx, mllib, mllibLocal, repl, networkCommon, networkShuffle, launcher, unsafe, tags, sketch, kvstore,
- commonUtils, variant, pipelines, _*
+ commonUtils, commonUtilsJava, variant, pipelines, _*
) = Seq(
"core", "graphx", "mllib", "mllib-local", "repl", "network-common", "network-shuffle", "launcher", "unsafe",
- "tags", "sketch", "kvstore", "common-utils", "variant", "pipelines"
+ "tags", "sketch", "kvstore", "common-utils", "common-utils-java", "variant", "pipelines"
).map(ProjectRef(buildLocation, _)) ++ sqlProjects ++ streamingProjects ++ connectProjects
val optionallyEnabledProjects@Seq(kubernetes, yarn,
@@ -99,6 +100,30 @@ object SparkBuild extends PomBuild {
import sbtunidoc.GenJavadocPlugin.autoImport._
import scala.collection.mutable.Map
+ lazy val checkJavaVersion = taskKey[Unit]("Check Java Version")
+ lazy val checkJavaVersionSettings: Seq[Setting[?]] = Seq(
+ checkJavaVersion := {
+ val currentVersion = JRuntime.version()
+ val currentVersionFeature = currentVersion.feature()
+ val currentVersionUpdate = currentVersion.update()
+ val minimumVersion = JRuntime.Version.parse(
+ SbtPomKeys.effectivePom.value.getProperties
+ .get("java.minimum.version").asInstanceOf[String])
+ val minimumVersionFeature = minimumVersion.feature()
+ val minimumVersionUpdate = minimumVersion.update()
+ val isCompatible = currentVersionFeature > minimumVersionFeature ||
+ (currentVersionFeature == minimumVersionFeature &&
+ currentVersionUpdate >= minimumVersionUpdate)
+ if (!isCompatible) {
+ throw new MessageOnlyException(
+ "The Java version used to build the project is outdated. " +
+ s"Please use Java $minimumVersion or later.")
+ }
+ },
+ (Compile / compile) := ((Compile / compile) dependsOn checkJavaVersion).value,
+ (Test / compile) := ((Test / compile) dependsOn checkJavaVersion).value
+ )
+
val projectsMap: Map[String, Seq[Setting[_]]] = Map.empty
override val profiles = {
@@ -261,7 +286,8 @@ object SparkBuild extends PomBuild {
val noLintOnCompile = sys.env.contains("NOLINT_ON_COMPILE") &&
!sys.env.get("NOLINT_ON_COMPILE").contains("false")
- lazy val sharedSettings = sparkGenjavadocSettings ++
+ lazy val sharedSettings = checkJavaVersionSettings ++
+ sparkGenjavadocSettings ++
compilerWarningSettings ++
(if (noLintOnCompile) Nil else enableScalaStyle) ++ Seq(
(Compile / exportJars) := true,
@@ -313,6 +339,7 @@ object SparkBuild extends PomBuild {
(Compile / javacOptions) ++= Seq(
"-encoding", UTF_8.name(),
"-g",
+ "-proc:full",
"--release", javaVersion.value
),
// This -target and Xlint:unchecked options cannot be set in the Compile configuration scope since
@@ -373,7 +400,7 @@ object SparkBuild extends PomBuild {
Seq(
spark, hive, hiveThriftServer, repl, networkCommon, networkShuffle, networkYarn,
unsafe, tags, tokenProviderKafka010, sqlKafka010, pipelines, connectCommon, connect,
- connectClient, variant, connectShims, profiler
+ connectClient, variant, connectShims, profiler, commonUtilsJava
).contains(x)
}
@@ -1078,6 +1105,7 @@ object ExcludedDependencies {
libraryDependencies ~= { libs => libs.filterNot(_.name == "groovy-all") },
excludeDependencies ++= Seq(
ExclusionRule(organization = "ch.qos.logback"),
+ ExclusionRule("org.slf4j", "slf4j-simple"),
ExclusionRule("javax.servlet", "javax.servlet-api"))
)
}
@@ -1516,6 +1544,9 @@ object CopyDependencies {
val fid = (LocalProject("connect") / assembly).value
val fidClient = (LocalProject("connect-client-jvm") / assembly).value
val fidProtobuf = (LocalProject("protobuf") / assembly).value
+ val noProvidedSparkJars: Boolean = sys.env.getOrElse("NO_PROVIDED_SPARK_JARS", "1") == "1" ||
+ sys.env.getOrElse("NO_PROVIDED_SPARK_JARS", "true")
+ .toLowerCase(Locale.getDefault()) == "true"
(Compile / dependencyClasspath).value.map(_.data)
.filter { jar => jar.isFile() }
@@ -1526,17 +1557,18 @@ object CopyDependencies {
destJar.delete()
}
- if (jar.getName.contains("spark-connect-common") &&
- !SbtPomKeys.profiles.value.contains("noshade-connect")) {
+ if (jar.getName.contains("spark-connect-common")) {
// Don't copy the spark connect common JAR as it is shaded in the spark connect.
} else if (jar.getName.contains("connect-client-jvm")) {
// Do not place Spark Connect client jars as it is not built-in.
- } else if (jar.getName.contains("spark-connect") &&
- !SbtPomKeys.profiles.value.contains("noshade-connect")) {
+ } else if (noProvidedSparkJars && jar.getName.contains("spark-avro")) {
+ // Do not place Spark Avro jars as it is not built-in.
+ } else if (jar.getName.contains("spark-connect")) {
Files.copy(fid.toPath, destJar.toPath)
- } else if (jar.getName.contains("spark-protobuf") &&
- !SbtPomKeys.profiles.value.contains("noshade-protobuf")) {
- Files.copy(fidProtobuf.toPath, destJar.toPath)
+ } else if (jar.getName.contains("spark-protobuf")) {
+ if (!noProvidedSparkJars) {
+ Files.copy(fidProtobuf.toPath, destJar.toPath)
+ }
} else {
Files.copy(jar.toPath(), destJar.toPath())
}
@@ -1651,6 +1683,7 @@ object TestSettings {
(Test / javaOptions) ++= System.getProperties.asScala.filter(_._1.startsWith("spark"))
.map { case (k,v) => s"-D$k=$v" }.toSeq,
(Test / javaOptions) += "-ea",
+ (Test / javaOptions) += s"-XX:ErrorFile=${baseDirectory.value}/target/hs_err_pid%p.log",
(Test / javaOptions) ++= {
val metaspaceSize = sys.env.get("METASPACE_SIZE").getOrElse("1300m")
val heapSize = sys.env.get("HEAP_SIZE").getOrElse("4g")
@@ -1722,7 +1755,7 @@ object TestSettings {
(Test / testOptions) += Tests.Argument(TestFrameworks.ScalaTest, "-W", "120", "300"),
(Test / testOptions) += Tests.Argument(TestFrameworks.JUnit, "-v", "-a"),
// Enable Junit testing.
- libraryDependencies += "com.github.sbt.junit" % "jupiter-interface" % "0.14.0" % "test",
+ libraryDependencies += "com.github.sbt.junit" % "jupiter-interface" % "0.15.0" % "test",
// `parallelExecutionInTest` controls whether test suites belonging to the same SBT project
// can run in parallel with one another. It does NOT control whether tests execute in parallel
// within the same JVM (which is controlled by `testForkedParallel`) or whether test cases
diff --git a/project/plugins.sbt b/project/plugins.sbt
index 579020e5af0ce..0e5ce79c8b567 100644
--- a/project/plugins.sbt
+++ b/project/plugins.sbt
@@ -41,6 +41,6 @@ addSbtPlugin("com.simplytyped" % "sbt-antlr4" % "0.8.3")
addSbtPlugin("com.github.sbt" % "sbt-pom-reader" % "2.4.0")
-addSbtPlugin("com.github.sbt.junit" % "sbt-jupiter-interface" % "0.14.0")
+addSbtPlugin("com.github.sbt.junit" % "sbt-jupiter-interface" % "0.15.0")
addSbtPlugin("com.thesamet" % "sbt-protoc" % "1.0.7")
diff --git a/python/docs/Makefile b/python/docs/Makefile
index eba8a3fffbcd1..045b03a1afd1b 100644
--- a/python/docs/Makefile
+++ b/python/docs/Makefile
@@ -22,7 +22,6 @@ SOURCEDIR ?= source
BUILDDIR ?= build
export PYTHONPATH=$(realpath ..):$(realpath ../lib/py4j-0.10.9.9-src.zip)
-export SPARK_ANSI_SQL_MODE=false
# Put it first so that "make" without argument is like "make help".
help:
diff --git a/python/docs/source/development/contributing.rst b/python/docs/source/development/contributing.rst
index fc2a1cc586040..4103a1e650930 100644
--- a/python/docs/source/development/contributing.rst
+++ b/python/docs/source/development/contributing.rst
@@ -129,8 +129,8 @@ If you are using Conda, the development environment can be set as follows.
.. code-block:: bash
- # Python 3.9+ is required
- conda create --name pyspark-dev-env python=3.9
+ # Python 3.10+ is required
+ conda create --name pyspark-dev-env python=3.10
conda activate pyspark-dev-env
pip install --upgrade -r dev/requirements.txt
@@ -145,7 +145,7 @@ Now, you can start developing and `running the tests `_.
pip
~~~
-With Python 3.9+, pip can be used as below to install and set up the development environment.
+With Python 3.10+, pip can be used as below to install and set up the development environment.
.. code-block:: bash
diff --git a/python/docs/source/development/debugging.rst b/python/docs/source/development/debugging.rst
index 0aa2426cf862d..9fa9a0c526cea 100644
--- a/python/docs/source/development/debugging.rst
+++ b/python/docs/source/development/debugging.rst
@@ -215,7 +215,7 @@ Python/Pandas UDF
~~~~~~~~~~~~~~~~~
PySpark provides remote `memory_profiler `_ for
-Python/Pandas UDFs. That can be used on editors with line numbers such as Jupyter notebooks. UDFs with iterators as inputs/outputs are not supported.
+Python/Pandas UDFs. That can be used on editors with line numbers such as Jupyter notebooks. UDFs that are generator functions are not supported.
SparkSession-based memory profiler can be enabled by setting the `Runtime SQL configuration `_
``spark.sql.pyspark.udf.profiler`` to ``memory``. An example on a Jupyter notebook is as shown below.
@@ -320,7 +320,7 @@ Python/Pandas UDF
~~~~~~~~~~~~~~~~~
PySpark provides remote `Python Profilers `_ for
-Python/Pandas UDFs. UDFs with iterators as inputs/outputs are not supported.
+Python/Pandas UDFs. UDFs that are generator functions are not supported.
SparkSession-based performance profiler can be enabled by setting the `Runtime SQL configuration `_
``spark.sql.pyspark.udf.profiler`` to ``perf``. An example is as shown below.
diff --git a/python/docs/source/getting_started/install.rst b/python/docs/source/getting_started/install.rst
index 5f445c8aa5242..82db489651ff9 100644
--- a/python/docs/source/getting_started/install.rst
+++ b/python/docs/source/getting_started/install.rst
@@ -30,7 +30,7 @@ and building from the source.
Python Versions Supported
-------------------------
-Python 3.9 and above.
+Python 3.10 and above.
Using PyPI
@@ -143,7 +143,7 @@ the same session as pyspark (you can install in several steps too).
.. code-block:: bash
- conda install -c conda-forge pyspark # can also add "python=3.9 some_package [etc.]" here
+ conda install -c conda-forge pyspark # can also add "python=3.10 some_package [etc.]" here
Note that `PySpark for conda `_ is maintained
separately by the community; while new versions generally get packaged quickly, the
@@ -225,8 +225,8 @@ Installable with ``pip install "pyspark[connect]"``.
========================== ================= ==========================
Package Supported version Note
========================== ================= ==========================
-`pandas` >=2.0.0 Required for Spark Connect
-`pyarrow` >=11.0.0 Required for Spark Connect
+`pandas` >=2.2.0 Required for Spark Connect
+`pyarrow` >=15.0.0 Required for Spark Connect
`grpcio` >=1.67.0 Required for Spark Connect
`grpcio-status` >=1.67.0 Required for Spark Connect
`googleapis-common-protos` >=1.65.0 Required for Spark Connect
@@ -241,8 +241,8 @@ Installable with ``pip install "pyspark[sql]"``.
========= ================= ======================
Package Supported version Note
========= ================= ======================
-`pandas` >=2.0.0 Required for Spark SQL
-`pyarrow` >=11.0.0 Required for Spark SQL
+`pandas` >=2.2.0 Required for Spark SQL
+`pyarrow` >=15.0.0 Required for Spark SQL
========= ================= ======================
Additional libraries that enhance functionality but are not included in the installation packages:
@@ -259,7 +259,7 @@ Installable with ``pip install "pyspark[pandas_on_spark]"``.
Package Supported version Note
========= ================= ================================
`pandas` >=2.2.0 Required for Pandas API on Spark
-`pyarrow` >=11.0.0 Required for Pandas API on Spark
+`pyarrow` >=15.0.0 Required for Pandas API on Spark
========= ================= ================================
Additional libraries that enhance functionality but are not included in the installation packages:
@@ -277,7 +277,7 @@ Installable with ``pip install "pyspark[ml]"``.
======= ================= ======================================
Package Supported version Note
======= ================= ======================================
-`numpy` >=1.21 Required for MLlib DataFrame-based API
+`numpy` >=1.22 Required for MLlib DataFrame-based API
======= ================= ======================================
Additional libraries that enhance functionality but are not included in the installation packages:
@@ -297,5 +297,22 @@ Installable with ``pip install "pyspark[mllib]"``.
======= ================= ==================
Package Supported version Note
======= ================= ==================
-`numpy` >=1.21 Required for MLlib
+`numpy` >=1.22 Required for MLlib
======= ================= ==================
+
+Declarative Pipelines
+^^^^^^^^^^^^^^^^^^^^^
+
+Installable with ``pip install "pyspark[pipelines]"``. Includes all dependencies for both Spark SQL and Spark Connect, because Declarative Pipelines is built on top of both.
+
+========================== ================= ===================================================
+Package Supported version Note
+========================== ================= ===================================================
+`pandas` >=2.2.0 Required for Spark Connect and Spark SQL
+`pyarrow` >=15.0.0 Required for Spark Connect and Spark SQL
+`grpcio` >=1.67.0 Required for Spark Connect
+`grpcio-status` >=1.67.0 Required for Spark Connect
+`googleapis-common-protos` >=1.65.0 Required for Spark Connect
+`pyyaml` >=3.11 Required for spark-pipelines command line interface
+`graphviz` >=0.20 Optional for Spark Connect
+========================== ================= ===================================================
diff --git a/python/docs/source/migration_guide/pyspark_upgrade.rst b/python/docs/source/migration_guide/pyspark_upgrade.rst
index f91e297539649..f7d80fe10786d 100644
--- a/python/docs/source/migration_guide/pyspark_upgrade.rst
+++ b/python/docs/source/migration_guide/pyspark_upgrade.rst
@@ -22,10 +22,16 @@ Upgrading PySpark
Upgrading from PySpark 4.0 to 4.1
---------------------------------
+* In Spark 4.1, Python 3.9 support was dropped in PySpark.
+* In Spark 4.1, the minimum supported version for PyArrow has been raised from 11.0.0 to 15.0.0 in PySpark.
+* In Spark 4.1, the minimum supported version for Pandas has been raised from 2.0.0 to 2.2.0 in PySpark.
+* In Spark 4.1, ``DataFrame['name']`` on Spark Connect Python Client no longer eagerly validates the column name. To restore the legacy behavior, set the ``PYSPARK_VALIDATE_COLUMN_NAME_LEGACY`` environment variable to ``1``.
* In Spark 4.1, Arrow-optimized Python UDF supports UDT input / output instead of falling back to the regular UDF. To restore the legacy behavior, set ``spark.sql.execution.pythonUDF.arrow.legacy.fallbackOnUDT`` to ``true``.
-
+* In Spark 4.1, unnecessary conversion to pandas instances is removed when ``spark.sql.execution.pythonUDF.arrow.enabled`` is enabled. As a result, the type coercion changes when the produced output has a schema different from the specified schema. To restore the previous behavior, enable ``spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled``.
* In Spark 4.1, unnecessary conversion to pandas instances is removed when ``spark.sql.execution.pythonUDTF.arrow.enabled`` is enabled. As a result, the type coercion changes when the produced output has a schema different from the specified schema. To restore the previous behavior, enable ``spark.sql.legacy.execution.pythonUDTF.pandas.conversion.enabled``.
+* In Spark 4.1, the ``spark.sql.execution.pandas.convertToArrowArraySafely`` configuration is enabled by default. When this setting is enabled, PyArrow raises errors for unsafe conversions such as integer overflows, floating point truncation, and loss of precision. This change affects the return data serialization of arrow-enabled UDFs/pandas_udfs, and the creation of PySpark DataFrames. To restore the previous behavior, set the configuration to ``false``.
+* In Spark 4.1, pandas API on Spark works under ANSI mode when ``compute.ansi_mode_support`` is set to ``True`` (default). The safeguard option ``compute.fail_on_ansi_mode`` remains available, but it only takes effect when ``compute.ansi_mode_support`` is ``False``.
Upgrading from PySpark 3.5 to 4.0
---------------------------------
diff --git a/python/docs/source/reference/pyspark.errors.rst b/python/docs/source/reference/pyspark.errors.rst
index 4d2bf76127795..1204cccc8df5b 100644
--- a/python/docs/source/reference/pyspark.errors.rst
+++ b/python/docs/source/reference/pyspark.errors.rst
@@ -50,7 +50,6 @@ Classes
QueryContext
QueryContextType
QueryExecutionException
- RetriesExceeded
SessionNotSameException
SparkRuntimeException
SparkUpgradeException
diff --git a/python/docs/source/reference/pyspark.sql/data_types.rst b/python/docs/source/reference/pyspark.sql/data_types.rst
index d201be271a6a6..99f8c5bb87ef9 100644
--- a/python/docs/source/reference/pyspark.sql/data_types.rst
+++ b/python/docs/source/reference/pyspark.sql/data_types.rst
@@ -31,6 +31,7 @@ Data Types
ByteType
DataType
DateType
+ TimeType
DecimalType
DoubleType
FloatType
diff --git a/python/docs/source/reference/pyspark.sql/functions.rst b/python/docs/source/reference/pyspark.sql/functions.rst
index a3a2e11daf2e1..7bec529407667 100644
--- a/python/docs/source/reference/pyspark.sql/functions.rst
+++ b/python/docs/source/reference/pyspark.sql/functions.rst
@@ -253,6 +253,7 @@ Date and Timestamp Functions
convert_timezone
curdate
current_date
+ current_time
current_timestamp
current_timezone
date_add
@@ -279,6 +280,7 @@ Date and Timestamp Functions
make_date
make_dt_interval
make_interval
+ make_time
make_timestamp
make_timestamp_ltz
make_timestamp_ntz
@@ -297,7 +299,9 @@ Date and Timestamp Functions
timestamp_micros
timestamp_millis
timestamp_seconds
+ time_trunc
to_date
+ to_time
to_timestamp
to_timestamp_ltz
to_timestamp_ntz
@@ -308,7 +312,9 @@ Date and Timestamp Functions
try_make_timestamp
try_make_timestamp_ltz
try_make_timestamp_ntz
+ try_to_time
try_to_timestamp
+ try_to_date
unix_date
unix_micros
unix_millis
@@ -643,6 +649,8 @@ UDF, UDTF and UDT
.. autosummary::
:toctree: api/
+ arrow_udf
+ arrow_udtf
call_udf
pandas_udf
udf
diff --git a/python/docs/source/tutorial/pandas_on_spark/options.rst b/python/docs/source/tutorial/pandas_on_spark/options.rst
index 74197a5d99750..25e9ceb5171d6 100644
--- a/python/docs/source/tutorial/pandas_on_spark/options.rst
+++ b/python/docs/source/tutorial/pandas_on_spark/options.rst
@@ -324,10 +324,10 @@ compute.fail_on_ansi_mode True 'compute.fail_on_ansi_mo
an exception if the underlying Spark is working with
ANSI mode enabled and the option
'compute.ansi_mode_support' is False.
-compute.ansi_mode_support False 'compute.ansi_mode_support' sets whether or not to
+compute.ansi_mode_support True 'compute.ansi_mode_support' sets whether or not to
support the ANSI mode of the underlying Spark. If
False, pandas API on Spark may hit unexpected results
- or errors. The default is False.
+ or errors. The default is True.
plotting.max_rows 1000 'plotting.max_rows' sets the visual limit on top-n-
based plots such as `plot.bar` and `plot.pie`. If it
is set to 1000, the first 1000 data points will be
diff --git a/python/docs/source/tutorial/pandas_on_spark/typehints.rst b/python/docs/source/tutorial/pandas_on_spark/typehints.rst
index 23126664d78a6..7045ce7f75987 100644
--- a/python/docs/source/tutorial/pandas_on_spark/typehints.rst
+++ b/python/docs/source/tutorial/pandas_on_spark/typehints.rst
@@ -62,7 +62,7 @@ it as a Spark schema. As an example, you can specify the return type hint as bel
Notice that the function ``pandas_div`` actually takes and outputs a pandas DataFrame instead of
pandas-on-Spark :class:`DataFrame`. So, technically the correct types should be of pandas.
-With Python 3.9+, you can specify the type hints by using pandas instances as follows:
+With Python 3.10+, you can specify the type hints by using pandas instances as follows:
.. code-block:: python
diff --git a/python/docs/source/tutorial/sql/arrow_pandas.rst b/python/docs/source/tutorial/sql/arrow_pandas.rst
index ffff59f136cbe..3bef50874d7ff 100644
--- a/python/docs/source/tutorial/sql/arrow_pandas.rst
+++ b/python/docs/source/tutorial/sql/arrow_pandas.rst
@@ -375,6 +375,12 @@ fallback for type mismatches, leading to potential ambiguity and data loss. Addi
and tuples to strings can yield ambiguous results. Arrow Python UDFs, on the other hand, leverage Arrow's
capabilities to standardize type coercion and address these issues effectively.
+A note on Arrow Python UDF type coercion: In Spark 4.1, unnecessary conversion to pandas instances is removed in the serializer
+when ``spark.sql.execution.pythonUDF.arrow.enabled`` is enabled. As a result, the type coercion changes
+when the produced output has a schema different from the specified schema. To restore the previous behavior,
+enable ``spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled``.
+The behavior difference is summarized in the tables `here `__.
+
Usage Notes
-----------
@@ -434,7 +440,7 @@ working with timestamps in ``pandas_udf``\s to get the best performance, see
Recommended Pandas and PyArrow Versions
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
-For usage with pyspark.sql, the minimum supported versions of Pandas is 2.0.0 and PyArrow is 11.0.0.
+For usage with pyspark.sql, the minimum supported versions are Pandas 2.2.0 and PyArrow 15.0.0.
Higher versions may be used, however, compatibility and data correctness can not be guaranteed and should
be verified by the user.
diff --git a/python/docs/source/tutorial/sql/arrow_python_udtf.rst b/python/docs/source/tutorial/sql/arrow_python_udtf.rst
new file mode 100644
index 0000000000000..3e933fea722f0
--- /dev/null
+++ b/python/docs/source/tutorial/sql/arrow_python_udtf.rst
@@ -0,0 +1,237 @@
+.. Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements. See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership. The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License. You may obtain a copy of the License at
+
+.. http://www.apache.org/licenses/LICENSE-2.0
+
+.. Unless required by applicable law or agreed to in writing,
+ software distributed under the License is distributed on an
+ "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ KIND, either express or implied. See the License for the
+ specific language governing permissions and limitations
+ under the License.
+
+======================================================
+Vectorized Python User-defined Table Functions (UDTFs)
+======================================================
+
+Spark 4.1 introduces the Vectorized Python user-defined table function (UDTF), a new type of user-defined table-valued function.
+It can be used via the ``@arrow_udtf`` decorator.
+Unlike scalar functions that return a single result value from each call, each UDTF is invoked in
+the ``FROM`` clause of a query and returns an entire table as output.
+Unlike the traditional Python UDTF, which evaluates rows one at a time, the Vectorized Python UDTF lets you operate directly on Apache Arrow arrays and record batches.
+This allows you to leverage vectorized operations and improve the performance of your UDTF.
+
+Vectorized Python UDTF Interface
+--------------------------------
+
+.. currentmodule:: pyspark.sql.functions
+
+.. code-block:: python
+
+ class NameYourArrowPythonUDTF:
+
+ def __init__(self) -> None:
+ """
+ Initializes the user-defined table function (UDTF). This is optional.
+
+ This method serves as the default constructor and is called once when the
+ UDTF is instantiated on the executor side.
+
+ Any class fields assigned in this method will be available for subsequent
+ calls to the `eval`, `terminate` and `cleanup` methods.
+
+ Notes
+ -----
+ - You cannot create or reference the Spark session within the UDTF. Any
+ attempt to do so will result in a serialization error.
+ """
+ ...
+
+ def eval(self, *args: Any) -> Iterator[pa.RecordBatch | pa.Table]:
+ """
+ Evaluates the function using the given input arguments.
+
+ This method is required and must be implemented.
+
+ Argument Mapping:
+ - Each provided scalar expression maps to exactly one value in the
+ `*args` list with type `pa.Array`.
+ - Each provided table argument maps to a `pa.RecordBatch` object containing
+ the columns in the order they appear in the provided input table,
+ and with the names computed by the query analyzer.
+
+ This method is called on every batch of input rows, and can produce zero or more
+ output pyarrow record batches or pyarrow tables. Each column in the yielded
+ batches or tables corresponds to one column specified in the return type of the UDTF.
+
+ Parameters
+ ----------
+ *args : Any
+ Arbitrary positional arguments representing the input to the UDTF.
+
+ Yields
+ ------
+ iterator
+ An iterator of `pa.RecordBatch` or `pa.Table` objects representing a batch of rows
+ in the UDTF result table. Yield as many times as needed to produce multiple batches.
+
+ Notes
+ -----
+ - UDTFs can instead accept keyword arguments during the function call if needed.
+ - The `eval` method can raise a `SkipRestOfInputTableException` to indicate that the
+ UDTF wants to skip consuming all remaining rows from the current partition of the
+ input table. This will cause the UDTF to proceed directly to the `terminate` method.
+ - The `eval` method can raise any other exception to indicate that the UDTF should be
+ aborted entirely. This will cause the UDTF to skip the `terminate` method and proceed
+ directly to the `cleanup` method, and then the exception will be propagated to the
+ query processor causing the invoking query to fail.
+
+ Examples
+ --------
+ This `eval` method takes a table argument and returns an arrow record batch for each input batch.
+
+ >>> def eval(self, batch: pa.RecordBatch):
+ ... yield batch
+
+ This `eval` method takes a table argument and returns a pyarrow table for each input batch.
+
+ >>> def eval(self, batch: pa.RecordBatch):
+ ... yield pa.table({"x": batch.column(0), "y": batch.column(1)})
+
+ This `eval` method takes both table and scalar arguments and returns a pyarrow table for each input batch.
+
+ >>> def eval(self, batch: pa.RecordBatch, x: pa.Array):
+ ... yield pa.table({"x": x, "y": batch.column(0)})
+ """
+ ...
+
+ def terminate(self) -> Iterator[pa.RecordBatch | pa.Table]:
+ """
+ Called when the UDTF has successfully processed all input rows.
+
+ This method is optional to implement and is useful for performing any
+ finalization operations after the UDTF has finished processing
+ all rows. It can also be used to yield additional rows if needed.
+ Table functions that consume all rows in the entire input partition
+ and then compute and return the entire output table can do so from
+ this method as well (please be mindful of memory usage when doing
+ this).
+
+ If any exceptions occur during input row processing, this method
+ won't be called.
+
+ Yields
+ ------
+ iterator
+ An iterator of `pa.RecordBatch` or `pa.Table` objects representing a batch of rows
+ in the UDTF result table. Yield as many times as needed to produce multiple batches.
+
+ Examples
+ --------
+ >>> def terminate(self) -> Iterator[pa.RecordBatch | pa.Table]:
+            ...     yield pa.table({"x": pa.array([1, 2, 3])})
+ """
+ ...
+
+ def cleanup(self) -> None:
+ """
+ Invoked after the UDTF completes processing input rows.
+
+ This method is optional to implement and is useful for final cleanup
+ regardless of whether the UDTF processed all input rows successfully
+ or was aborted due to exceptions.
+
+ Examples
+ --------
+ >>> def cleanup(self) -> None:
+            ...     self.conn.close()
+ """
+ ...
+
+Defining the Output Schema
+--------------------------
+
+The return type of the UDTF defines the schema of the table it outputs.
+You can specify it in the ``@arrow_udtf`` decorator.
+
+It must be either a ``StructType``:
+
+.. code-block:: python
+
+ @arrow_udtf(returnType=StructType().add("c1", StringType()).add("c2", IntegerType()))
+ class YourArrowPythonUDTF:
+ ...
+
+or a DDL string representing a struct type:
+
+.. code-block:: python
+
+ @arrow_udtf(returnType="c1 string, c2 int")
+ class YourArrowPythonUDTF:
+ ...
+
+Emitting Output Rows
+--------------------
+
+The `eval` and `terminate` methods then emit zero or more output batches conforming to this schema by
+yielding ``pa.RecordBatch`` or ``pa.Table`` objects.
+
+.. code-block:: python
+
+ @arrow_udtf(returnType="c1 int, c2 int")
+ class YourArrowPythonUDTF:
+ def eval(self, batch: pa.RecordBatch):
+ yield pa.table({"c1": batch.column(0), "c2": batch.column(1)})
+
+You can also yield multiple pyarrow tables in the `eval` method.
+
+.. code-block:: python
+
+ @arrow_udtf(returnType="c1 int")
+ class YourArrowPythonUDTF:
+ def eval(self, batch: pa.RecordBatch):
+ yield pa.table({"c1": batch.column(0)})
+ yield pa.table({"c1": batch.column(1)})
+
+You can also yield multiple pyarrow record batches in the `eval` method.
+
+.. code-block:: python
+
+ @arrow_udtf(returnType="c1 int")
+ class YourArrowPythonUDTF:
+ def eval(self, batch: pa.RecordBatch):
+            half = len(batch) // 2
+            yield pa.record_batch({"c1": batch.column(0).slice(0, half)})
+            yield pa.record_batch({"c1": batch.column(0).slice(half)})
+
+
+Usage Examples
+--------------
+
+Here's how to use these UDTFs with the DataFrame API and in SQL:
+
+.. code-block:: python
+
+ import pyarrow as pa
+ from pyspark.sql.functions import arrow_udtf
+
+ @arrow_udtf(returnType="c1 string")
+ class MyArrowPythonUDTF:
+ def eval(self, batch: pa.RecordBatch):
+ yield pa.table({"c1": batch.column("value")})
+
+ df = spark.range(10).selectExpr("id", "cast(id as string) as value")
+ MyArrowPythonUDTF(df.asTable()).show()
+
+ # Register the UDTF
+ spark.udtf.register("my_arrow_udtf", MyArrowPythonUDTF)
+
+ # Use in SQL queries
+ df = spark.sql("""
+ SELECT * FROM my_arrow_udtf(TABLE(SELECT id, cast(id as string) as value FROM range(10)))
+ """)
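+
+The `terminate` method can also emit rows after all input batches have been processed.
+The sketch below builds on the example above; the class name, column name, and footer
+value are illustrative.
+
+.. code-block:: python
+
+    import pyarrow as pa
+    from pyspark.sql.functions import arrow_udtf
+
+    @arrow_udtf(returnType="c1 string")
+    class WithFooterUDTF:
+        def eval(self, batch: pa.RecordBatch):
+            # Pass each input batch through unchanged.
+            yield pa.table({"c1": batch.column("value")})
+
+        def terminate(self):
+            # Emit one extra row once all input batches have been consumed.
+            yield pa.table({"c1": pa.array(["<done>"])})
+
+    df = spark.range(10).selectExpr("cast(id as string) as value")
+    WithFooterUDTF(df.asTable()).show()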
diff --git a/python/docs/source/tutorial/sql/index.rst b/python/docs/source/tutorial/sql/index.rst
index d1b67f7eeb909..c2f2c57baadaf 100644
--- a/python/docs/source/tutorial/sql/index.rst
+++ b/python/docs/source/tutorial/sql/index.rst
@@ -24,6 +24,7 @@ Spark SQL
:maxdepth: 2
arrow_pandas
+ arrow_python_udtf
python_udtf
python_data_source
type_conversions
diff --git a/python/docs/source/tutorial/sql/python_data_source.rst b/python/docs/source/tutorial/sql/python_data_source.rst
index 22b2a0b5f3c7b..41b76c95d5806 100644
--- a/python/docs/source/tutorial/sql/python_data_source.rst
+++ b/python/docs/source/tutorial/sql/python_data_source.rst
@@ -520,4 +520,6 @@ The following example demonstrates how to implement a basic Data Source using Ar
Usage Notes
-----------
-- During Data Source resolution, built-in and Scala/Java Data Sources take precedence over Python Data Sources with the same name; to explicitly use a Python Data Source, make sure its name does not conflict with the other Data Sources.
+- During Data Source resolution, built-in and Scala/Java Data Sources take precedence over Python Data Sources with the same name; to explicitly use a Python Data Source, make sure its name does not conflict with the other non-Python Data Sources.
+- Multiple Python Data Sources may be registered under the same name; later registrations overwrite earlier ones.
+- To automatically register a data source, export it as ``DefaultSource`` in a top-level module with name prefix ``pyspark_`` (see the sketch below). See `pyspark_huggingface `_ for an example.
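+
+For illustration, a minimal auto-registered package might look like the following sketch; the module name ``pyspark_fake``, its short name, and its schema are hypothetical:
+
+.. code-block:: python
+
+    # Contents of a top-level module named ``pyspark_fake`` (name and data are hypothetical).
+    from pyspark.sql.datasource import DataSource, DataSourceReader
+
+    class _FakeReader(DataSourceReader):
+        def read(self, partition):
+            # Emit a few hard-coded rows matching the schema declared below.
+            yield ("hello", 0)
+            yield ("world", 1)
+
+    class DefaultSource(DataSource):
+        # Exported as ``DefaultSource`` so Spark can discover it without an explicit register call.
+        @classmethod
+        def name(cls):
+            return "fake"
+
+        def schema(self):
+            return "value string, id int"
+
+        def reader(self, schema):
+            return _FakeReader()
+
+If such a module is importable, ``spark.read.format("fake").load()`` should pick it up without calling ``spark.dataSource.register``.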
diff --git a/python/docs/source/tutorial/sql/python_udtf.rst b/python/docs/source/tutorial/sql/python_udtf.rst
index ac394d9e5360f..a989848448c9d 100644
--- a/python/docs/source/tutorial/sql/python_udtf.rst
+++ b/python/docs/source/tutorial/sql/python_udtf.rst
@@ -351,7 +351,7 @@ or a DDL string representing a struct type:
.. code-block:: python
- c1: string
+ c1 string
Emitting Output Rows
--------------------
diff --git a/python/docs/source/user_guide/ansi_migration_guide.ipynb b/python/docs/source/user_guide/ansi_migration_guide.ipynb
new file mode 100644
index 0000000000000..5193b307aadf3
--- /dev/null
+++ b/python/docs/source/user_guide/ansi_migration_guide.ipynb
@@ -0,0 +1,196 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "id": "4fa81d13",
+ "metadata": {},
+ "source": [
+ "# ANSI Migration Guide - Pandas API on Spark\n",
+ "ANSI mode is now on by default for Pandas API on Spark. This guide helps you understand the key behavior differences you’ll see.\n",
+    "In short, with ANSI mode on, the Pandas API on Spark matches native pandas behavior in cases where it previously did not with ANSI off."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "6e1c7952",
+ "metadata": {},
+ "source": [
+    "## Behavior Changes\n",
+ "### String Number Comparison\n",
+ "**ANSI off:** Spark implicitly casts numbers and strings, so `1` and `'1'` are considered equal.\n",
+ "\n",
+    "**ANSI on:** behaves like pandas: `1 == '1'` is `False`."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "69474e28-c1cd-40fe-8ec6-7373b56c4dee",
+ "metadata": {},
+ "source": [
+    "For example:\n",
+ "\n",
+ "```python\n",
+ ">>> pdf = pd.DataFrame({\"int\": [1, 2], \"str\": [\"1\", \"2\"]})\n",
+ ">>> psdf = ps.from_pandas(pdf)\n",
+ "\n",
+ "# ANSI on\n",
+ ">>> spark.conf.set(\"spark.sql.ansi.enabled\", True)\n",
+ ">>> psdf[\"int\"] == psdf[\"str\"]\n",
+ "0 False\n",
+ "1 False\n",
+ "dtype: bool\n",
+ "\n",
+ "# ANSI off\n",
+ ">>> spark.conf.set(\"spark.sql.ansi.enabled\", False)\n",
+ ">>> psdf[\"int\"] == psdf[\"str\"]\n",
+ "0 True\n",
+ "1 True\n",
+ "dtype: bool\n",
+ "\n",
+ "# Pandas\n",
+ ">>> pdf[\"int\"] == pdf[\"str\"]\n",
+ "0 False\n",
+ "1 False\n",
+ "dtype: bool\n",
+ "```"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "90a4ea8d",
+ "metadata": {},
+ "source": [
+ "### Strict Casting\n",
+    "**ANSI off:** invalid casts (e.g., `'a' → int`) quietly become NULL.\n",
+ "\n",
+ "**ANSI on:** the same casts raise errors."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "b361febc-4435-4bd1-9ee1-4874413d770c",
+ "metadata": {},
+ "source": [
+    "For example:\n",
+ "\n",
+ "```python\n",
+ ">>> pdf = pd.DataFrame({\"str\": [\"a\"]})\n",
+ ">>> psdf = ps.from_pandas(pdf)\n",
+ "\n",
+ "# ANSI on\n",
+ ">>> spark.conf.set(\"spark.sql.ansi.enabled\", True)\n",
+ ">>> psdf[\"str\"].astype(int)\n",
+ "Traceback (most recent call last):\n",
+ "...\n",
+ "pyspark.errors.exceptions.captured.NumberFormatException: [CAST_INVALID_INPUT] ...\n",
+ "\n",
+ "# ANSI off\n",
+ ">>> spark.conf.set(\"spark.sql.ansi.enabled\", False)\n",
+ ">>> psdf[\"str\"].astype(int)\n",
+ "0 NaN\n",
+ "Name: str, dtype: float64\n",
+ "\n",
+ "# Pandas\n",
+ ">>> pdf[\"str\"].astype(int)\n",
+ "Traceback (most recent call last):\n",
+ "...\n",
+ "ValueError: invalid literal for int() with base 10: 'a'\n",
+ "```"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "e11583e2",
+ "metadata": {},
+ "source": [
+ "### MultiIndex.to_series Return\n",
+ "**ANSI off:** Each row is returned as an `ArrayType` value, e.g. `[1, red]`.\n",
+ "\n",
+ "**ANSI on:** Each row is returned as a `StructType` value, which appears as a tuple (e.g., `(1, red)`) if the Runtime SQL Configuration `spark.sql.execution.pandas.structHandlingMode` is set to `'row'`. Otherwise, the result may vary depending on whether Arrow is used. See more in the [Spark Runtime SQL Configuration docs](https://spark.apache.org/docs/latest/configuration.html#runtime-sql-configuration)."
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "4671a895-ed40-4bc4-b1bc-fa9fbb86cc18",
+ "metadata": {},
+ "source": [
+    "For example:\n",
+ "\n",
+ "```python\n",
+ ">>> arrays = [[1, 2], [\"red\", \"blue\"]]\n",
+ ">>> pidx = pd.MultiIndex.from_arrays(arrays, names=(\"number\", \"color\"))\n",
+ ">>> psidx = ps.from_pandas(pidx)\n",
+ "\n",
+ "# ANSI on\n",
+ ">>> spark.conf.set(\"spark.sql.ansi.enabled\", True)\n",
+ ">>> spark.conf.set(\"spark.sql.execution.pandas.structHandlingMode\", \"row\")\n",
+ ">>> psidx.to_series()\n",
+ "number color\n",
+ "1 red (1, red)\n",
+ "2 blue (2, blue)\n",
+ "dtype: object\n",
+ "\n",
+ "# ANSI off\n",
+ ">>> spark.conf.set(\"spark.sql.ansi.enabled\", False)\n",
+ ">>> psidx.to_series()\n",
+ "number color\n",
+ "1 red [1, red]\n",
+ "2 blue [2, blue]\n",
+ "dtype: object\n",
+ "\n",
+ "# Pandas\n",
+ ">>> pidx.to_series()\n",
+ "number color\n",
+ "1 red (1, red)\n",
+ "2 blue (2, blue)\n",
+ "dtype: object\n",
+ "```"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "id": "fe146afd",
+ "metadata": {},
+ "source": [
+ "## Related Configurations\n",
+ "\n",
+ "### `spark.sql.ansi.enabled` (Spark config)\n",
+ "- Native Spark setting that controls ANSI mode. \n",
+    "- The primary switch: it controls both SQL and pandas API on Spark behavior.\n",
+    "- If set to **False**, Spark reverts to the old behavior and the options below have no effect.\n",
+ "\n",
+ "### `compute.ansi_mode_support` (Pandas API on Spark option)\n",
+    "- Indicates whether the pandas API on Spark fully supports ANSI mode.\n",
+    "- Effective only when ANSI is enabled.\n",
+    "- If set to **False**, pandas API on Spark may produce unexpected results or errors.\n",
+ "- Default is **True**.\n",
+ "\n",
+ "### `compute.fail_on_ansi_mode` (Pandas API on Spark option)\n",
+ "- Controls whether pandas API on Spark fails immediately when ANSI mode is enabled. \n",
+ "- Effective only when ANSI is enabled and `compute.ansi_mode_support` is **False**. \n",
+    "- If set to **False**, pandas API on Spark falls back to the old behavior even when ANSI is enabled (see the example below).\n",
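+    "\n",
+    "For example, to keep ANSI mode enabled in Spark while falling back to the old Pandas API on Spark behavior, the options above can be set at runtime (a minimal sketch):\n",
+    "\n",
+    "```python\n",
+    ">>> import pyspark.pandas as ps\n",
+    ">>> spark.conf.set(\"spark.sql.ansi.enabled\", True)\n",
+    ">>> ps.set_option(\"compute.ansi_mode_support\", False)\n",
+    ">>> ps.set_option(\"compute.fail_on_ansi_mode\", False)  # fall back to the old behavior instead of failing\n",
+    "```"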
+ ]
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3 (ipykernel)",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.11.13"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/python/docs/source/user_guide/index.rst b/python/docs/source/user_guide/index.rst
index 1da4dd2e6eb13..e95a6ec0c64d8 100644
--- a/python/docs/source/user_guide/index.rst
+++ b/python/docs/source/user_guide/index.rst
@@ -33,5 +33,6 @@ Each of the below sections contains code-driven examples to help you get familia
udfandudtf
sql
loadandbehold
+ ansi_migration_guide
diff --git a/python/packaging/classic/setup.py b/python/packaging/classic/setup.py
index 51ab69c6e4cc6..fcb607a561b3d 100755
--- a/python/packaging/classic/setup.py
+++ b/python/packaging/classic/setup.py
@@ -150,9 +150,9 @@ def _supports_symlinks():
# binary format protocol with the Java version, see ARROW_HOME/format/* for specifications.
# Also don't forget to update python/docs/source/getting_started/install.rst,
# python/packaging/client/setup.py, and python/packaging/connect/setup.py
-_minimum_pandas_version = "2.0.0"
+_minimum_pandas_version = "2.2.0"
_minimum_numpy_version = "1.21"
-_minimum_pyarrow_version = "11.0.0"
+_minimum_pyarrow_version = "15.0.0"
_minimum_grpc_version = "1.67.0"
_minimum_googleapis_common_protos_version = "1.65.0"
_minimum_pyyaml_version = "3.11"
@@ -366,14 +366,21 @@ def run(self):
"grpcio-status>=%s" % _minimum_grpc_version,
"googleapis-common-protos>=%s" % _minimum_googleapis_common_protos_version,
"numpy>=%s" % _minimum_numpy_version,
+ ],
+ "pipelines": [
+ "pandas>=%s" % _minimum_pandas_version,
+ "pyarrow>=%s" % _minimum_pyarrow_version,
+ "numpy>=%s" % _minimum_numpy_version,
+ "grpcio>=%s" % _minimum_grpc_version,
+ "grpcio-status>=%s" % _minimum_grpc_version,
+ "googleapis-common-protos>=%s" % _minimum_googleapis_common_protos_version,
"pyyaml>=%s" % _minimum_pyyaml_version,
],
},
- python_requires=">=3.9",
+ python_requires=">=3.10",
classifiers=[
"Development Status :: 5 - Production/Stable",
"License :: OSI Approved :: Apache Software License",
- "Programming Language :: Python :: 3.9",
"Programming Language :: Python :: 3.10",
"Programming Language :: Python :: 3.11",
"Programming Language :: Python :: 3.12",
diff --git a/python/packaging/client/setup.py b/python/packaging/client/setup.py
index ac80e3a1ff585..d70c17465331d 100755
--- a/python/packaging/client/setup.py
+++ b/python/packaging/client/setup.py
@@ -133,9 +133,9 @@
# binary format protocol with the Java version, see ARROW_HOME/format/* for specifications.
# Also don't forget to update python/docs/source/getting_started/install.rst,
# python/packaging/classic/setup.py, and python/packaging/connect/setup.py
- _minimum_pandas_version = "2.0.0"
+ _minimum_pandas_version = "2.2.0"
_minimum_numpy_version = "1.21"
- _minimum_pyarrow_version = "11.0.0"
+ _minimum_pyarrow_version = "15.0.0"
_minimum_grpc_version = "1.67.0"
_minimum_googleapis_common_protos_version = "1.65.0"
_minimum_pyyaml_version = "3.11"
@@ -214,11 +214,10 @@
"numpy>=%s" % _minimum_numpy_version,
"pyyaml>=%s" % _minimum_pyyaml_version,
],
- python_requires=">=3.9",
+ python_requires=">=3.10",
classifiers=[
"Development Status :: 5 - Production/Stable",
"License :: OSI Approved :: Apache Software License",
- "Programming Language :: Python :: 3.9",
"Programming Language :: Python :: 3.10",
"Programming Language :: Python :: 3.11",
"Programming Language :: Python :: 3.12",
diff --git a/python/pyspark/errors/__init__.py b/python/pyspark/errors/__init__.py
index 98f8aa593371e..c20b057b74e61 100644
--- a/python/pyspark/errors/__init__.py
+++ b/python/pyspark/errors/__init__.py
@@ -46,7 +46,6 @@
PySparkAssertionError,
PySparkNotImplementedError,
PySparkPicklingError,
- RetriesExceeded,
PySparkKeyError,
QueryContext,
QueryContextType,
@@ -83,7 +82,6 @@
"PySparkAssertionError",
"PySparkNotImplementedError",
"PySparkPicklingError",
- "RetriesExceeded",
"PySparkKeyError",
"QueryContext",
"QueryContextType",
diff --git a/python/pyspark/errors/error-conditions.json b/python/pyspark/errors/error-conditions.json
index b9ed246753906..1da6b8e154784 100644
--- a/python/pyspark/errors/error-conditions.json
+++ b/python/pyspark/errors/error-conditions.json
@@ -174,6 +174,13 @@
"`` does not allow a Column in a list."
]
},
+ "CONFLICTING_PIPELINE_REFRESH_OPTIONS" : {
+ "message" : [
+ "--full-refresh-all option conflicts with ",
+ "The --full-refresh-all option performs a full refresh of all datasets, ",
+ "so specifying individual datasets with is not allowed."
+ ]
+ },
"CONNECT_URL_ALREADY_DEFINED": {
"message": [
"Only one Spark Connect client URL can be set; however, got a different URL [] from the existing []."
@@ -377,6 +384,11 @@
"The return type of the arrow-optimized Python UDTF should be of type 'pandas.DataFrame', but the '' method returned a value of type with value: ."
]
},
+ "INVALID_ARROW_UDTF_WITH_ANALYZE": {
+ "message": [
+ "The arrow UDTF '' is invalid. Arrow UDTFs do not support the 'analyze' method. Please remove the 'analyze' method from '' and specify a returnType instead."
+ ]
+ },
"INVALID_BROADCAST_OPERATION": {
"message": [
"Broadcast can only be in driver."
@@ -884,6 +896,11 @@
"No pipeline.yaml or pipeline.yml file provided in arguments or found in directory `` or readable ancestor directories."
]
},
+ "PIPELINE_SPEC_MISSING_REQUIRED_FIELD": {
+ "message": [
+ "Pipeline spec missing required field ``."
+ ]
+ },
"PIPELINE_SPEC_UNEXPECTED_FIELD": {
"message": [
"Pipeline spec field `` is unexpected."
@@ -970,14 +987,14 @@
"Columns do not match in their data type: ."
]
},
- "RETRIES_EXCEEDED": {
+ "REUSE_OBSERVATION": {
"message": [
- "The maximum number of retries has been exceeded."
+ "An Observation can be used with a DataFrame only once."
]
},
- "REUSE_OBSERVATION": {
+ "SCHEMA_MISMATCH_FOR_ARROW_PYTHON_UDF": {
"message": [
- "An Observation can be used with a DataFrame only once."
+ "Result vector from was not the required length: expected , got ."
]
},
"SCHEMA_MISMATCH_FOR_PANDAS_UDF": {
@@ -990,6 +1007,73 @@
"Cannot start a remote Spark session because there is a regular Spark session already running."
]
},
+ "SESSION_MUTATION_IN_DECLARATIVE_PIPELINE": {
+ "message": [
+ "Session mutation is not allowed in declarative pipelines."
+ ],
+ "sub_class": {
+ "SET_RUNTIME_CONF": {
+ "message": [
+ "Instead set configuration via the pipeline spec or use the 'spark_conf' argument in various decorators."
+ ]
+ },
+ "SET_CURRENT_CATALOG": {
+ "message": [
+ "Instead set catalog via the pipeline spec or the 'name' argument on the dataset decorators."
+ ]
+ },
+ "SET_CURRENT_DATABASE": {
+ "message": [
+ "Instead set database via the pipeline spec or the 'name' argument on the dataset decorators."
+ ]
+ },
+ "DROP_TEMP_VIEW": {
+ "message": [
+ "Instead remove the temporary view definition directly."
+ ]
+ },
+ "DROP_GLOBAL_TEMP_VIEW": {
+ "message": [
+ "Instead remove the temporary view definition directly."
+ ]
+ },
+ "CREATE_TEMP_VIEW": {
+ "message": [
+ "Instead use the @temporary_view decorator to define temporary views."
+ ]
+ },
+ "CREATE_OR_REPLACE_TEMP_VIEW": {
+ "message": [
+ "Instead use the @temporary_view decorator to define temporary views."
+ ]
+ },
+ "CREATE_GLOBAL_TEMP_VIEW": {
+ "message": [
+ "Instead use the @temporary_view decorator to define temporary views."
+ ]
+ },
+ "CREATE_OR_REPLACE_GLOBAL_TEMP_VIEW": {
+ "message": [
+ "Instead use the @temporary_view decorator to define temporary views."
+ ]
+ },
+ "REGISTER_UDF": {
+ "message": [
+ ""
+ ]
+ },
+ "REGISTER_JAVA_UDF": {
+ "message": [
+ ""
+ ]
+ },
+ "REGISTER_JAVA_UDAF": {
+ "message": [
+ ""
+ ]
+ }
+ }
+ },
"SESSION_NEED_CONN_STR_OR_BUILDER": {
"message": [
"Needs either connection string or channelBuilder (mutually exclusive) to create a new SparkSession."
@@ -1062,7 +1146,7 @@
},
"UDTF_ARROW_TYPE_CONVERSION_ERROR": {
"message": [
- "Cannot convert the output value of the input '' with type '' to the specified return type of the column: ''. Please check if the data types match and try again."
+ "PyArrow UDTF must return an iterator of pyarrow.Table or pyarrow.RecordBatch objects."
]
},
"UDTF_CONSTRUCTOR_INVALID_IMPLEMENTS_ANALYZE_METHOD": {
diff --git a/python/pyspark/errors/exceptions/base.py b/python/pyspark/errors/exceptions/base.py
index 4fa7ea92e34cb..b0455b64dabfb 100644
--- a/python/pyspark/errors/exceptions/base.py
+++ b/python/pyspark/errors/exceptions/base.py
@@ -350,13 +350,6 @@ class PySparkPicklingError(PySparkException, PicklingError):
"""
-class RetriesExceeded(PySparkException):
- """
- Represents an exception which is considered retriable, but retry limits
- were exceeded
- """
-
-
class PySparkKeyError(PySparkException, KeyError):
"""
Wrapper class for KeyError to support error classes.
diff --git a/python/pyspark/errors/tests/test_connect_errors_conversion.py b/python/pyspark/errors/tests/test_connect_errors_conversion.py
index 344af2ad62331..f80a6301d61b6 100644
--- a/python/pyspark/errors/tests/test_connect_errors_conversion.py
+++ b/python/pyspark/errors/tests/test_connect_errors_conversion.py
@@ -18,7 +18,7 @@
import unittest
-from pyspark.testing import should_test_connect, connect_requirement_message
+from pyspark.testing.utils import should_test_connect, connect_requirement_message
if should_test_connect:
from pyspark.errors.exceptions.connect import (
diff --git a/python/pyspark/ml/classification.py b/python/pyspark/ml/classification.py
index a5fdaed0db2c4..f66fc762971b5 100644
--- a/python/pyspark/ml/classification.py
+++ b/python/pyspark/ml/classification.py
@@ -889,15 +889,14 @@ def summary(self) -> "LinearSVCTrainingSummary": # type: ignore[override]
Gets summary (accuracy/precision/recall, objective history, total iterations) of model
trained on the training set. An exception is thrown if `trainingSummary is None`.
"""
- if self.hasSummary:
- s = LinearSVCTrainingSummary(super(LinearSVCModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
+ return super().summary
+
+ @property
+ def _summaryCls(self) -> type:
+ return LinearSVCTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
def evaluate(self, dataset: DataFrame) -> "LinearSVCSummary":
"""
@@ -1577,29 +1576,6 @@ def interceptVector(self) -> Vector:
"""
return self._call_java("interceptVector")
- @property
- @since("2.0.0")
- def summary(self) -> "LogisticRegressionTrainingSummary":
- """
- Gets summary (accuracy/precision/recall, objective history, total iterations) of model
- trained on the training set. An exception is thrown if `trainingSummary is None`.
- """
- if self.hasSummary:
- s: LogisticRegressionTrainingSummary
- if self.numClasses <= 2:
- s = BinaryLogisticRegressionTrainingSummary(
- super(LogisticRegressionModel, self).summary
- )
- else:
- s = LogisticRegressionTrainingSummary(super(LogisticRegressionModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
-
def evaluate(self, dataset: DataFrame) -> "LogisticRegressionSummary":
"""
Evaluates the model on a test dataset.
@@ -1623,6 +1599,15 @@ def evaluate(self, dataset: DataFrame) -> "LogisticRegressionSummary":
s.__source_transformer__ = self # type: ignore[attr-defined]
return s
+ @property
+ def _summaryCls(self) -> type:
+ if self.numClasses <= 2:
+ return BinaryLogisticRegressionTrainingSummary
+ return LogisticRegressionTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
+
class LogisticRegressionSummary(_ClassificationSummary):
"""
@@ -2315,29 +2300,13 @@ def trees(self) -> List[DecisionTreeClassificationModel]:
return [DecisionTreeClassificationModel(m) for m in list(self._call_java("trees"))]
@property
- @since("3.1.0")
- def summary(self) -> "RandomForestClassificationTrainingSummary":
- """
- Gets summary (accuracy/precision/recall, objective history, total iterations) of model
- trained on the training set. An exception is thrown if `trainingSummary is None`.
- """
- if self.hasSummary:
- s: RandomForestClassificationTrainingSummary
- if self.numClasses <= 2:
- s = BinaryRandomForestClassificationTrainingSummary(
- super(RandomForestClassificationModel, self).summary
- )
- else:
- s = RandomForestClassificationTrainingSummary(
- super(RandomForestClassificationModel, self).summary
- )
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
+ def _summaryCls(self) -> type:
+ if self.numClasses <= 2:
+ return BinaryRandomForestClassificationTrainingSummary
+ return RandomForestClassificationTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
def evaluate(self, dataset: DataFrame) -> "RandomForestClassificationSummary":
"""
@@ -3372,17 +3341,14 @@ def summary( # type: ignore[override]
Gets summary (accuracy/precision/recall, objective history, total iterations) of model
trained on the training set. An exception is thrown if `trainingSummary is None`.
"""
- if self.hasSummary:
- s = MultilayerPerceptronClassificationTrainingSummary(
- super(MultilayerPerceptronClassificationModel, self).summary
- )
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
+ return super().summary
+
+ @property
+ def _summaryCls(self) -> type:
+ return MultilayerPerceptronClassificationTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
def evaluate(self, dataset: DataFrame) -> "MultilayerPerceptronClassificationSummary":
"""
@@ -4321,22 +4287,6 @@ def factors(self) -> Matrix:
"""
return self._call_java("factors")
- @since("3.1.0")
- def summary(self) -> "FMClassificationTrainingSummary":
- """
- Gets summary (accuracy/precision/recall, objective history, total iterations) of model
- trained on the training set. An exception is thrown if `trainingSummary is None`.
- """
- if self.hasSummary:
- s = FMClassificationTrainingSummary(super(FMClassificationModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
-
def evaluate(self, dataset: DataFrame) -> "FMClassificationSummary":
"""
Evaluates the model on a test dataset.
@@ -4356,6 +4306,21 @@ def evaluate(self, dataset: DataFrame) -> "FMClassificationSummary":
s.__source_transformer__ = self # type: ignore[attr-defined]
return s
+ @since("3.1.0")
+ def summary(self) -> "FMClassificationTrainingSummary":
+ """
+ Gets summary (accuracy/precision/recall, objective history, total iterations) of model
+ trained on the training set. An exception is thrown if `trainingSummary is None`.
+ """
+ return super().summary
+
+ @property
+ def _summaryCls(self) -> type:
+ return FMClassificationTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
+
class FMClassificationSummary(_BinaryClassificationSummary):
"""
diff --git a/python/pyspark/ml/clustering.py b/python/pyspark/ml/clustering.py
index 7267ee2805987..0e26398de3c45 100644
--- a/python/pyspark/ml/clustering.py
+++ b/python/pyspark/ml/clustering.py
@@ -255,23 +255,6 @@ def gaussiansDF(self) -> DataFrame:
"""
return self._call_java("gaussiansDF")
- @property
- @since("2.1.0")
- def summary(self) -> "GaussianMixtureSummary":
- """
- Gets summary (cluster assignments, cluster sizes) of the model trained on the
- training set. An exception is thrown if no summary exists.
- """
- if self.hasSummary:
- s = GaussianMixtureSummary(super(GaussianMixtureModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
-
@since("3.0.0")
def predict(self, value: Vector) -> int:
"""
@@ -286,6 +269,10 @@ def predictProbability(self, value: Vector) -> Vector:
"""
return self._call_java("predictProbability", value)
+ @property
+ def _summaryCls(self) -> type:
+ return GaussianMixtureSummary
+
@inherit_doc
class GaussianMixture(
@@ -705,23 +692,6 @@ def numFeatures(self) -> int:
"""
return self._call_java("numFeatures")
- @property
- @since("2.1.0")
- def summary(self) -> KMeansSummary:
- """
- Gets summary (cluster assignments, cluster sizes) of the model trained on the
- training set. An exception is thrown if no summary exists.
- """
- if self.hasSummary:
- s = KMeansSummary(super(KMeansModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
-
@since("3.0.0")
def predict(self, value: Vector) -> int:
"""
@@ -729,6 +699,10 @@ def predict(self, value: Vector) -> int:
"""
return self._call_java("predict", value)
+ @property
+ def _summaryCls(self) -> type:
+ return KMeansSummary
+
@inherit_doc
class KMeans(JavaEstimator[KMeansModel], _KMeansParams, JavaMLWritable, JavaMLReadable["KMeans"]):
@@ -1055,23 +1029,6 @@ def numFeatures(self) -> int:
"""
return self._call_java("numFeatures")
- @property
- @since("2.1.0")
- def summary(self) -> "BisectingKMeansSummary":
- """
- Gets summary (cluster assignments, cluster sizes) of the model trained on the
- training set. An exception is thrown if no summary exists.
- """
- if self.hasSummary:
- s = BisectingKMeansSummary(super(BisectingKMeansModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
-
@since("3.0.0")
def predict(self, value: Vector) -> int:
"""
@@ -1079,6 +1036,10 @@ def predict(self, value: Vector) -> int:
"""
return self._call_java("predict", value)
+ @property
+ def _summaryCls(self) -> type:
+ return BisectingKMeansSummary
+
@inherit_doc
class BisectingKMeans(
diff --git a/python/pyspark/ml/connect/functions.py b/python/pyspark/ml/connect/functions.py
index 22ff32a5946de..8df40a400c5fe 100644
--- a/python/pyspark/ml/connect/functions.py
+++ b/python/pyspark/ml/connect/functions.py
@@ -58,7 +58,7 @@ def _test() -> None:
print("Not supported in no-GIL mode", file=sys.stderr)
sys.exit(0)
- from pyspark.testing import should_test_connect
+ from pyspark.testing.utils import should_test_connect
if not should_test_connect:
print("Skipping pyspark.ml.connect.functions doctests", file=sys.stderr)
diff --git a/python/pyspark/ml/connect/proto.py b/python/pyspark/ml/connect/proto.py
index 31f100859281a..7cffd32631ba5 100644
--- a/python/pyspark/ml/connect/proto.py
+++ b/python/pyspark/ml/connect/proto.py
@@ -70,8 +70,13 @@ class AttributeRelation(LogicalPlan):
could be a model or a summary. This attribute returns a DataFrame.
"""
- def __init__(self, ref_id: str, methods: List[pb2.Fetch.Method]) -> None:
- super().__init__(None)
+ def __init__(
+ self,
+ ref_id: str,
+ methods: List[pb2.Fetch.Method],
+ child: Optional["LogicalPlan"] = None,
+ ) -> None:
+ super().__init__(child)
self._ref_id = ref_id
self._methods = methods
@@ -79,4 +84,6 @@ def plan(self, session: "SparkConnectClient") -> pb2.Relation:
plan = self._create_proto_relation()
plan.ml_relation.fetch.obj_ref.CopyFrom(pb2.ObjectRef(id=self._ref_id))
plan.ml_relation.fetch.methods.extend(self._methods)
+ if self._child is not None:
+ plan.ml_relation.model_summary_dataset.CopyFrom(self._child.plan(session))
return plan
diff --git a/python/pyspark/ml/regression.py b/python/pyspark/ml/regression.py
index 66d6dbd6a2678..ce97b98f6665c 100644
--- a/python/pyspark/ml/regression.py
+++ b/python/pyspark/ml/regression.py
@@ -479,22 +479,11 @@ def scale(self) -> float:
return self._call_java("scale")
@property
- @since("2.0.0")
- def summary(self) -> "LinearRegressionTrainingSummary":
- """
- Gets summary (residuals, MSE, r-squared ) of model on
- training set. An exception is thrown if
- `trainingSummary is None`.
- """
- if self.hasSummary:
- s = LinearRegressionTrainingSummary(super(LinearRegressionModel, self).summary)
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
+ def _summaryCls(self) -> type:
+ return LinearRegressionTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
def evaluate(self, dataset: DataFrame) -> "LinearRegressionSummary":
"""
@@ -2774,24 +2763,11 @@ def intercept(self) -> float:
return self._call_java("intercept")
@property
- @since("2.0.0")
- def summary(self) -> "GeneralizedLinearRegressionTrainingSummary":
- """
- Gets summary (residuals, deviance, p-values) of model on
- training set. An exception is thrown if
- `trainingSummary is None`.
- """
- if self.hasSummary:
- s = GeneralizedLinearRegressionTrainingSummary(
- super(GeneralizedLinearRegressionModel, self).summary
- )
- if is_remote():
- s.__source_transformer__ = self # type: ignore[attr-defined]
- return s
- else:
- raise RuntimeError(
- "No training summary available for this %s" % self.__class__.__name__
- )
+ def _summaryCls(self) -> type:
+ return GeneralizedLinearRegressionTrainingSummary
+
+ def _summary_dataset(self, train_dataset: DataFrame) -> DataFrame:
+ return train_dataset
def evaluate(self, dataset: DataFrame) -> "GeneralizedLinearRegressionSummary":
"""
diff --git a/python/pyspark/ml/tests/connect/test_connect_cache.py b/python/pyspark/ml/tests/connect/test_connect_cache.py
index 8d156a0f11e1d..b6c801f32eaf0 100644
--- a/python/pyspark/ml/tests/connect/test_connect_cache.py
+++ b/python/pyspark/ml/tests/connect/test_connect_cache.py
@@ -48,20 +48,27 @@ def test_delete_model(self):
"obj: class org.apache.spark.ml.classification.LinearSVCModel" in cache_info[0],
cache_info,
)
- assert model._java_obj._ref_count == 1
+        # `model._summary` holds another ref to the remote model.
+ assert model._java_obj._ref_count == 2
+
+ model_size = spark.client._query_model_size(model._java_obj.ref_id)
+ assert isinstance(model_size, int) and model_size > 0
model2 = model.copy()
cache_info = spark.client._get_ml_cache_info()
self.assertEqual(len(cache_info), 1)
- assert model._java_obj._ref_count == 2
- assert model2._java_obj._ref_count == 2
+ assert model._java_obj._ref_count == 3
+ assert model2._java_obj._ref_count == 3
# explicitly delete the model
del model
cache_info = spark.client._get_ml_cache_info()
self.assertEqual(len(cache_info), 1)
- assert model2._java_obj._ref_count == 1
+        # Note the copied model 'model2' also holds the `_summary` object,
+        # and the `_summary` object holds another ref to the remote model,
+        # so the ref count is 2.
+ assert model2._java_obj._ref_count == 2
del model2
cache_info = spark.client._get_ml_cache_info()
@@ -99,7 +106,6 @@ def test_cleanup_ml_cache(self):
cache_info,
)
- # explicitly delete the model1
del model1
cache_info = spark.client._get_ml_cache_info()
diff --git a/python/pyspark/ml/tests/connect/test_parity_classification.py b/python/pyspark/ml/tests/connect/test_parity_classification.py
index 3c7e8ff71a2d6..7805546dba707 100644
--- a/python/pyspark/ml/tests/connect/test_parity_classification.py
+++ b/python/pyspark/ml/tests/connect/test_parity_classification.py
@@ -21,6 +21,8 @@
from pyspark.testing.connectutils import ReusedConnectTestCase
+# TODO(SPARK-52764): Re-enable this test after fixing the flakiness.
+@unittest.skip("Disabled due to flakiness, should be enabled after fixing the issue")
class ClassificationParityTests(ClassificationTestsMixin, ReusedConnectTestCase):
pass
diff --git a/python/pyspark/ml/tests/connect/test_parity_clustering.py b/python/pyspark/ml/tests/connect/test_parity_clustering.py
index 99714b0d6962b..bbfd2a2aea806 100644
--- a/python/pyspark/ml/tests/connect/test_parity_clustering.py
+++ b/python/pyspark/ml/tests/connect/test_parity_clustering.py
@@ -21,6 +21,8 @@
from pyspark.testing.connectutils import ReusedConnectTestCase
+# TODO(SPARK-52764): Re-enable this test after fixing the flakiness.
+@unittest.skip("Disabled due to flakiness, should be enabled after fixing the issue")
class ClusteringParityTests(ClusteringTestsMixin, ReusedConnectTestCase):
pass
diff --git a/python/pyspark/ml/tests/connect/test_parity_regression.py b/python/pyspark/ml/tests/connect/test_parity_regression.py
index 7c2743a938fa0..407280827076c 100644
--- a/python/pyspark/ml/tests/connect/test_parity_regression.py
+++ b/python/pyspark/ml/tests/connect/test_parity_regression.py
@@ -21,6 +21,8 @@
from pyspark.testing.connectutils import ReusedConnectTestCase
+# TODO(SPARK-52764): Re-enable this test after fixing the flakiness.
+@unittest.skip("Disabled due to flakiness, should be enabled after fixing the issue")
class RegressionParityTests(RegressionTestsMixin, ReusedConnectTestCase):
pass
diff --git a/python/pyspark/ml/tests/connect/test_parity_torch_distributor.py b/python/pyspark/ml/tests/connect/test_parity_torch_distributor.py
index fc0500b8e83a7..3061ecb60c1d9 100644
--- a/python/pyspark/ml/tests/connect/test_parity_torch_distributor.py
+++ b/python/pyspark/ml/tests/connect/test_parity_torch_distributor.py
@@ -21,8 +21,12 @@
from pyspark.util import is_remote_only
from pyspark.sql import SparkSession
-from pyspark.testing import should_test_connect, connect_requirement_message
-from pyspark.testing.utils import have_torch, torch_requirement_message
+from pyspark.testing.utils import (
+ have_torch,
+ torch_requirement_message,
+ should_test_connect,
+ connect_requirement_message,
+)
if not is_remote_only() and should_test_connect:
from pyspark.ml.torch.tests.test_distributor import (
diff --git a/python/pyspark/ml/tests/test_classification.py b/python/pyspark/ml/tests/test_classification.py
index 57e4c0ef86dc0..21bce70e8735b 100644
--- a/python/pyspark/ml/tests/test_classification.py
+++ b/python/pyspark/ml/tests/test_classification.py
@@ -55,6 +55,7 @@
MultilayerPerceptronClassificationTrainingSummary,
)
from pyspark.ml.regression import DecisionTreeRegressionModel
+from pyspark.sql import is_remote
from pyspark.testing.sqlutils import ReusedSQLTestCase
@@ -241,37 +242,45 @@ def test_binary_logistic_regression_summary(self):
model = lr.fit(df)
self.assertEqual(lr.uid, model.uid)
self.assertTrue(model.hasSummary)
- s = model.summary
- # test that api is callable and returns expected types
- self.assertTrue(isinstance(s.predictions, DataFrame))
- self.assertEqual(s.probabilityCol, "probability")
- self.assertEqual(s.labelCol, "label")
- self.assertEqual(s.featuresCol, "features")
- self.assertEqual(s.predictionCol, "prediction")
- objHist = s.objectiveHistory
- self.assertTrue(isinstance(objHist, list) and isinstance(objHist[0], float))
- self.assertGreater(s.totalIterations, 0)
- self.assertTrue(isinstance(s.labels, list))
- self.assertTrue(isinstance(s.truePositiveRateByLabel, list))
- self.assertTrue(isinstance(s.falsePositiveRateByLabel, list))
- self.assertTrue(isinstance(s.precisionByLabel, list))
- self.assertTrue(isinstance(s.recallByLabel, list))
- self.assertTrue(isinstance(s.fMeasureByLabel(), list))
- self.assertTrue(isinstance(s.fMeasureByLabel(1.0), list))
- self.assertTrue(isinstance(s.roc, DataFrame))
- self.assertAlmostEqual(s.areaUnderROC, 1.0, 2)
- self.assertTrue(isinstance(s.pr, DataFrame))
- self.assertTrue(isinstance(s.fMeasureByThreshold, DataFrame))
- self.assertTrue(isinstance(s.precisionByThreshold, DataFrame))
- self.assertTrue(isinstance(s.recallByThreshold, DataFrame))
- self.assertAlmostEqual(s.accuracy, 1.0, 2)
- self.assertAlmostEqual(s.weightedTruePositiveRate, 1.0, 2)
- self.assertAlmostEqual(s.weightedFalsePositiveRate, 0.0, 2)
- self.assertAlmostEqual(s.weightedRecall, 1.0, 2)
- self.assertAlmostEqual(s.weightedPrecision, 1.0, 2)
- self.assertAlmostEqual(s.weightedFMeasure(), 1.0, 2)
- self.assertAlmostEqual(s.weightedFMeasure(1.0), 1.0, 2)
+ def check_summary():
+ s = model.summary
+ # test that api is callable and returns expected types
+ self.assertTrue(isinstance(s.predictions, DataFrame))
+ self.assertEqual(s.probabilityCol, "probability")
+ self.assertEqual(s.labelCol, "label")
+ self.assertEqual(s.featuresCol, "features")
+ self.assertEqual(s.predictionCol, "prediction")
+ objHist = s.objectiveHistory
+ self.assertTrue(isinstance(objHist, list) and isinstance(objHist[0], float))
+ self.assertGreater(s.totalIterations, 0)
+ self.assertTrue(isinstance(s.labels, list))
+ self.assertTrue(isinstance(s.truePositiveRateByLabel, list))
+ self.assertTrue(isinstance(s.falsePositiveRateByLabel, list))
+ self.assertTrue(isinstance(s.precisionByLabel, list))
+ self.assertTrue(isinstance(s.recallByLabel, list))
+ self.assertTrue(isinstance(s.fMeasureByLabel(), list))
+ self.assertTrue(isinstance(s.fMeasureByLabel(1.0), list))
+ self.assertTrue(isinstance(s.roc, DataFrame))
+ self.assertAlmostEqual(s.areaUnderROC, 1.0, 2)
+ self.assertTrue(isinstance(s.pr, DataFrame))
+ self.assertTrue(isinstance(s.fMeasureByThreshold, DataFrame))
+ self.assertTrue(isinstance(s.precisionByThreshold, DataFrame))
+ self.assertTrue(isinstance(s.recallByThreshold, DataFrame))
+ self.assertAlmostEqual(s.accuracy, 1.0, 2)
+ self.assertAlmostEqual(s.weightedTruePositiveRate, 1.0, 2)
+ self.assertAlmostEqual(s.weightedFalsePositiveRate, 0.0, 2)
+ self.assertAlmostEqual(s.weightedRecall, 1.0, 2)
+ self.assertAlmostEqual(s.weightedPrecision, 1.0, 2)
+ self.assertAlmostEqual(s.weightedFMeasure(), 1.0, 2)
+ self.assertAlmostEqual(s.weightedFMeasure(1.0), 1.0, 2)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
+
+ s = model.summary
# test evaluation (with training dataset) produces a summary with same values
# one check is enough to verify a summary is returned, Scala version runs full test
sameSummary = model.evaluate(df)
@@ -292,31 +301,39 @@ def test_multiclass_logistic_regression_summary(self):
lr = LogisticRegression(maxIter=5, regParam=0.01, weightCol="weight", fitIntercept=False)
model = lr.fit(df)
self.assertTrue(model.hasSummary)
- s = model.summary
- # test that api is callable and returns expected types
- self.assertTrue(isinstance(s.predictions, DataFrame))
- self.assertEqual(s.probabilityCol, "probability")
- self.assertEqual(s.labelCol, "label")
- self.assertEqual(s.featuresCol, "features")
- self.assertEqual(s.predictionCol, "prediction")
- objHist = s.objectiveHistory
- self.assertTrue(isinstance(objHist, list) and isinstance(objHist[0], float))
- self.assertGreater(s.totalIterations, 0)
- self.assertTrue(isinstance(s.labels, list))
- self.assertTrue(isinstance(s.truePositiveRateByLabel, list))
- self.assertTrue(isinstance(s.falsePositiveRateByLabel, list))
- self.assertTrue(isinstance(s.precisionByLabel, list))
- self.assertTrue(isinstance(s.recallByLabel, list))
- self.assertTrue(isinstance(s.fMeasureByLabel(), list))
- self.assertTrue(isinstance(s.fMeasureByLabel(1.0), list))
- self.assertAlmostEqual(s.accuracy, 0.75, 2)
- self.assertAlmostEqual(s.weightedTruePositiveRate, 0.75, 2)
- self.assertAlmostEqual(s.weightedFalsePositiveRate, 0.25, 2)
- self.assertAlmostEqual(s.weightedRecall, 0.75, 2)
- self.assertAlmostEqual(s.weightedPrecision, 0.583, 2)
- self.assertAlmostEqual(s.weightedFMeasure(), 0.65, 2)
- self.assertAlmostEqual(s.weightedFMeasure(1.0), 0.65, 2)
+ def check_summary():
+ s = model.summary
+ # test that api is callable and returns expected types
+ self.assertTrue(isinstance(s.predictions, DataFrame))
+ self.assertEqual(s.probabilityCol, "probability")
+ self.assertEqual(s.labelCol, "label")
+ self.assertEqual(s.featuresCol, "features")
+ self.assertEqual(s.predictionCol, "prediction")
+ objHist = s.objectiveHistory
+ self.assertTrue(isinstance(objHist, list) and isinstance(objHist[0], float))
+ self.assertGreater(s.totalIterations, 0)
+ self.assertTrue(isinstance(s.labels, list))
+ self.assertTrue(isinstance(s.truePositiveRateByLabel, list))
+ self.assertTrue(isinstance(s.falsePositiveRateByLabel, list))
+ self.assertTrue(isinstance(s.precisionByLabel, list))
+ self.assertTrue(isinstance(s.recallByLabel, list))
+ self.assertTrue(isinstance(s.fMeasureByLabel(), list))
+ self.assertTrue(isinstance(s.fMeasureByLabel(1.0), list))
+ self.assertAlmostEqual(s.accuracy, 0.75, 2)
+ self.assertAlmostEqual(s.weightedTruePositiveRate, 0.75, 2)
+ self.assertAlmostEqual(s.weightedFalsePositiveRate, 0.25, 2)
+ self.assertAlmostEqual(s.weightedRecall, 0.75, 2)
+ self.assertAlmostEqual(s.weightedPrecision, 0.583, 2)
+ self.assertAlmostEqual(s.weightedFMeasure(), 0.65, 2)
+ self.assertAlmostEqual(s.weightedFMeasure(1.0), 0.65, 2)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
+
+ s = model.summary
# test evaluation (with training dataset) produces a summary with same values
# one check is enough to verify a summary is returned, Scala version runs full test
sameSummary = model.evaluate(df)
@@ -426,15 +443,21 @@ def test_linear_svc(self):
self.assertEqual(output.columns, expected_cols)
self.assertEqual(output.count(), 4)
- # model summary
- self.assertTrue(model.hasSummary)
- summary = model.summary()
- self.assertIsInstance(summary, LinearSVCSummary)
- self.assertIsInstance(summary, LinearSVCTrainingSummary)
- self.assertEqual(summary.labels, [0.0, 1.0])
- self.assertEqual(summary.accuracy, 0.5)
- self.assertEqual(summary.areaUnderROC, 0.75)
- self.assertEqual(summary.predictions.columns, expected_cols)
+ def check_summary():
+ # model summary
+ self.assertTrue(model.hasSummary)
+ summary = model.summary()
+ self.assertIsInstance(summary, LinearSVCSummary)
+ self.assertIsInstance(summary, LinearSVCTrainingSummary)
+ self.assertEqual(summary.labels, [0.0, 1.0])
+ self.assertEqual(summary.accuracy, 0.5)
+ self.assertEqual(summary.areaUnderROC, 0.75)
+ self.assertEqual(summary.predictions.columns, expected_cols)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
summary2 = model.evaluate(df)
self.assertIsInstance(summary2, LinearSVCSummary)
@@ -526,13 +549,20 @@ def test_factorization_machine(self):
# model summary
self.assertTrue(model.hasSummary)
- summary = model.summary()
- self.assertIsInstance(summary, FMClassificationSummary)
- self.assertIsInstance(summary, FMClassificationTrainingSummary)
- self.assertEqual(summary.labels, [0.0, 1.0])
- self.assertEqual(summary.accuracy, 0.25)
- self.assertEqual(summary.areaUnderROC, 0.5)
- self.assertEqual(summary.predictions.columns, expected_cols)
+
+ def check_summary():
+ summary = model.summary()
+ self.assertIsInstance(summary, FMClassificationSummary)
+ self.assertIsInstance(summary, FMClassificationTrainingSummary)
+ self.assertEqual(summary.labels, [0.0, 1.0])
+ self.assertEqual(summary.accuracy, 0.25)
+ self.assertEqual(summary.areaUnderROC, 0.5)
+ self.assertEqual(summary.predictions.columns, expected_cols)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
summary2 = model.evaluate(df)
self.assertIsInstance(summary2, FMClassificationSummary)
@@ -773,21 +803,27 @@ def test_binary_random_forest_classifier(self):
self.assertEqual(tree.transform(df).count(), 4)
self.assertEqual(tree.transform(df).columns, expected_cols)
- # model summary
- summary = model.summary
- self.assertTrue(isinstance(summary, BinaryRandomForestClassificationSummary))
- self.assertTrue(isinstance(summary, BinaryRandomForestClassificationTrainingSummary))
- self.assertEqual(summary.labels, [0.0, 1.0])
- self.assertEqual(summary.accuracy, 0.75)
- self.assertEqual(summary.areaUnderROC, 0.875)
- self.assertEqual(summary.predictions.columns, expected_cols)
+ def check_summary():
+ # model summary
+ summary = model.summary
+ self.assertTrue(isinstance(summary, BinaryRandomForestClassificationSummary))
+ self.assertTrue(isinstance(summary, BinaryRandomForestClassificationTrainingSummary))
+ self.assertEqual(summary.labels, [0.0, 1.0])
+ self.assertEqual(summary.accuracy, 0.75)
+ self.assertEqual(summary.areaUnderROC, 0.875)
+ self.assertEqual(summary.predictions.columns, expected_cols)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
summary2 = model.evaluate(df)
self.assertTrue(isinstance(summary2, BinaryRandomForestClassificationSummary))
self.assertFalse(isinstance(summary2, BinaryRandomForestClassificationTrainingSummary))
self.assertEqual(summary2.labels, [0.0, 1.0])
self.assertEqual(summary2.accuracy, 0.75)
- self.assertEqual(summary.areaUnderROC, 0.875)
+ self.assertEqual(summary2.areaUnderROC, 0.875)
self.assertEqual(summary2.predictions.columns, expected_cols)
# Model save & load
@@ -859,13 +895,19 @@ def test_multiclass_random_forest_classifier(self):
self.assertEqual(output.columns, expected_cols)
self.assertEqual(output.count(), 4)
- # model summary
- summary = model.summary
- self.assertTrue(isinstance(summary, RandomForestClassificationSummary))
- self.assertTrue(isinstance(summary, RandomForestClassificationTrainingSummary))
- self.assertEqual(summary.labels, [0.0, 1.0, 2.0])
- self.assertEqual(summary.accuracy, 0.5)
- self.assertEqual(summary.predictions.columns, expected_cols)
+ def check_summary():
+ # model summary
+ summary = model.summary
+ self.assertTrue(isinstance(summary, RandomForestClassificationSummary))
+ self.assertTrue(isinstance(summary, RandomForestClassificationTrainingSummary))
+ self.assertEqual(summary.labels, [0.0, 1.0, 2.0])
+ self.assertEqual(summary.accuracy, 0.5)
+ self.assertEqual(summary.predictions.columns, expected_cols)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
summary2 = model.evaluate(df)
self.assertTrue(isinstance(summary2, RandomForestClassificationSummary))
@@ -953,14 +995,20 @@ def test_mlp(self):
self.assertEqual(output.columns, expected_cols)
self.assertEqual(output.count(), 4)
- # model summary
- self.assertTrue(model.hasSummary)
- summary = model.summary()
- self.assertIsInstance(summary, MultilayerPerceptronClassificationSummary)
- self.assertIsInstance(summary, MultilayerPerceptronClassificationTrainingSummary)
- self.assertEqual(summary.labels, [0.0, 1.0])
- self.assertEqual(summary.accuracy, 0.75)
- self.assertEqual(summary.predictions.columns, expected_cols)
+ def check_summary():
+ # model summary
+ self.assertTrue(model.hasSummary)
+ summary = model.summary()
+ self.assertIsInstance(summary, MultilayerPerceptronClassificationSummary)
+ self.assertIsInstance(summary, MultilayerPerceptronClassificationTrainingSummary)
+ self.assertEqual(summary.labels, [0.0, 1.0])
+ self.assertEqual(summary.accuracy, 0.75)
+ self.assertEqual(summary.predictions.columns, expected_cols)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
summary2 = model.evaluate(df)
self.assertIsInstance(summary2, MultilayerPerceptronClassificationSummary)
diff --git a/python/pyspark/ml/tests/test_clustering.py b/python/pyspark/ml/tests/test_clustering.py
index 1b8eb73135a96..fbf012babcc3d 100644
--- a/python/pyspark/ml/tests/test_clustering.py
+++ b/python/pyspark/ml/tests/test_clustering.py
@@ -85,23 +85,39 @@ def test_kmeans(self):
self.assertTrue(np.allclose(model.predict(Vectors.dense(0.0, 5.0)), 1, atol=1e-4))
- # Model summary
- self.assertTrue(model.hasSummary)
- summary = model.summary
- self.assertTrue(isinstance(summary, KMeansSummary))
- self.assertEqual(summary.k, 2)
- self.assertEqual(summary.numIter, 2)
- self.assertEqual(summary.clusterSizes, [4, 2])
- self.assertTrue(np.allclose(summary.trainingCost, 1.35710375, atol=1e-4))
+ def check_summary():
+ # Model summary
+ self.assertTrue(model.hasSummary)
+ summary = model.summary
+ self.assertTrue(isinstance(summary, KMeansSummary))
+ self.assertEqual(summary.k, 2)
+ self.assertEqual(summary.numIter, 2)
+ self.assertEqual(summary.clusterSizes, [4, 2])
+ self.assertTrue(np.allclose(summary.trainingCost, 1.35710375, atol=1e-4))
- self.assertEqual(summary.featuresCol, "features")
- self.assertEqual(summary.predictionCol, "prediction")
+ self.assertEqual(summary.featuresCol, "features")
+ self.assertEqual(summary.predictionCol, "prediction")
- self.assertEqual(summary.cluster.columns, ["prediction"])
- self.assertEqual(summary.cluster.count(), 6)
+ self.assertEqual(summary.cluster.columns, ["prediction"])
+ self.assertEqual(summary.cluster.count(), 6)
- self.assertEqual(summary.predictions.columns, expected_cols)
- self.assertEqual(summary.predictions.count(), 6)
+ self.assertEqual(summary.predictions.columns, expected_cols)
+ self.assertEqual(summary.predictions.count(), 6)
+
+ # check summary before model offloading occurs
+ check_summary()
+
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ # check summary "try_remote_call" path after model offloading occurs
+ self.assertEqual(model.summary.numIter, 2)
+
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ # check summary "invoke_remote_attribute_relation" path after model offloading occurs
+ self.assertEqual(model.summary.cluster.count(), 6)
+
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
# save & load
with tempfile.TemporaryDirectory(prefix="kmeans_model") as d:
@@ -112,6 +128,9 @@ def test_kmeans(self):
model.write().overwrite().save(d)
model2 = KMeansModel.load(d)
self.assertEqual(str(model), str(model2))
+ self.assertFalse(model2.hasSummary)
+ with self.assertRaisesRegex(Exception, "No training summary available"):
+ model2.summary
def test_bisecting_kmeans(self):
df = (
@@ -278,30 +297,36 @@ def test_gaussian_mixture(self):
self.assertEqual(output.columns, expected_cols)
self.assertEqual(output.count(), 6)
- # Model summary
- self.assertTrue(model.hasSummary)
- summary = model.summary
- self.assertTrue(isinstance(summary, GaussianMixtureSummary))
- self.assertEqual(summary.k, 2)
- self.assertEqual(summary.numIter, 2)
- self.assertEqual(len(summary.clusterSizes), 2)
- self.assertEqual(summary.clusterSizes, [3, 3])
- ll = summary.logLikelihood
- self.assertTrue(ll < 0, ll)
- self.assertTrue(np.allclose(ll, -1.311264553744033, atol=1e-4), ll)
-
- self.assertEqual(summary.featuresCol, "features")
- self.assertEqual(summary.predictionCol, "prediction")
- self.assertEqual(summary.probabilityCol, "probability")
-
- self.assertEqual(summary.cluster.columns, ["prediction"])
- self.assertEqual(summary.cluster.count(), 6)
-
- self.assertEqual(summary.predictions.columns, expected_cols)
- self.assertEqual(summary.predictions.count(), 6)
-
- self.assertEqual(summary.probability.columns, ["probability"])
- self.assertEqual(summary.predictions.count(), 6)
+ def check_summary():
+ # Model summary
+ self.assertTrue(model.hasSummary)
+ summary = model.summary
+ self.assertTrue(isinstance(summary, GaussianMixtureSummary))
+ self.assertEqual(summary.k, 2)
+ self.assertEqual(summary.numIter, 2)
+ self.assertEqual(len(summary.clusterSizes), 2)
+ self.assertEqual(summary.clusterSizes, [3, 3])
+ ll = summary.logLikelihood
+ self.assertTrue(ll < 0, ll)
+ self.assertTrue(np.allclose(ll, -1.311264553744033, atol=1e-4), ll)
+
+ self.assertEqual(summary.featuresCol, "features")
+ self.assertEqual(summary.predictionCol, "prediction")
+ self.assertEqual(summary.probabilityCol, "probability")
+
+ self.assertEqual(summary.cluster.columns, ["prediction"])
+ self.assertEqual(summary.cluster.count(), 6)
+
+ self.assertEqual(summary.predictions.columns, expected_cols)
+ self.assertEqual(summary.predictions.count(), 6)
+
+ self.assertEqual(summary.probability.columns, ["probability"])
+ self.assertEqual(summary.predictions.count(), 6)
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
# save & load
with tempfile.TemporaryDirectory(prefix="gaussian_mixture") as d:
diff --git a/python/pyspark/ml/tests/test_pipeline.py b/python/pyspark/ml/tests/test_pipeline.py
index 892ce72e32bc4..fe12f9e504f1d 100644
--- a/python/pyspark/ml/tests/test_pipeline.py
+++ b/python/pyspark/ml/tests/test_pipeline.py
@@ -174,6 +174,7 @@ def test_clustering_pipeline(self):
self.assertEqual(str(model), str(model2))
self.assertEqual(str(model.stages), str(model2.stages))
+ @unittest.skip("Disabled due to flakiness, it might hang forever occasionally.")
def test_model_gc(self):
spark = self.spark
df1 = spark.createDataFrame(
@@ -201,6 +202,7 @@ def fit_transform_and_union(df1, df2):
output2 = fit_transform_and_union(df1, df2)
self.assertEqual(output2.count(), 13)
+ @unittest.skip("Disabled due to flakiness, it might hang forever occasionally.")
def test_model_training_summary_gc(self):
spark = self.spark
df1 = spark.createDataFrame(
@@ -228,6 +230,7 @@ def fit_predictions_and_union(df1, df2):
output2 = fit_predictions_and_union(df1, df2)
self.assertEqual(output2.count(), 13)
+ @unittest.skip("Disabled due to flakiness, it might hang forever occasionally.")
def test_model_testing_summary_gc(self):
spark = self.spark
df1 = spark.createDataFrame(
@@ -255,6 +258,7 @@ def fit_predictions_and_union(df1, df2):
output2 = fit_predictions_and_union(df1, df2)
self.assertEqual(output2.count(), 13)
+ @unittest.skip("Disabled due to flakiness, it might hang forever occasionally.")
def test_model_attr_df_gc(self):
spark = self.spark
df1 = (
diff --git a/python/pyspark/ml/tests/test_regression.py b/python/pyspark/ml/tests/test_regression.py
index 8638fb4d6078e..52688fdd63cf2 100644
--- a/python/pyspark/ml/tests/test_regression.py
+++ b/python/pyspark/ml/tests/test_regression.py
@@ -43,6 +43,7 @@
GBTRegressor,
GBTRegressionModel,
)
+from pyspark.sql import is_remote
from pyspark.testing.sqlutils import ReusedSQLTestCase
@@ -193,50 +194,58 @@ def test_linear_regression(self):
np.allclose(model.predict(Vectors.dense(0.0, 5.0)), 0.21249999999999963, atol=1e-4)
)
- # Model summary
- summary = model.summary
- self.assertTrue(isinstance(summary, LinearRegressionSummary))
- self.assertTrue(isinstance(summary, LinearRegressionTrainingSummary))
- self.assertEqual(summary.predictions.columns, expected_cols)
- self.assertEqual(summary.predictions.count(), 4)
- self.assertEqual(summary.residuals.columns, ["residuals"])
- self.assertEqual(summary.residuals.count(), 4)
-
- self.assertEqual(summary.degreesOfFreedom, 1)
- self.assertEqual(summary.numInstances, 4)
- self.assertEqual(summary.objectiveHistory, [0.0])
- self.assertTrue(
- np.allclose(
- summary.coefficientStandardErrors,
- [1.2859821149611763, 0.6248749874975031, 3.1645497310044184],
- atol=1e-4,
+ def check_summary():
+ # Model summary
+ summary = model.summary
+ self.assertTrue(isinstance(summary, LinearRegressionSummary))
+ self.assertTrue(isinstance(summary, LinearRegressionTrainingSummary))
+ self.assertEqual(summary.predictions.columns, expected_cols)
+ self.assertEqual(summary.predictions.count(), 4)
+ self.assertEqual(summary.residuals.columns, ["residuals"])
+ self.assertEqual(summary.residuals.count(), 4)
+
+ self.assertEqual(summary.degreesOfFreedom, 1)
+ self.assertEqual(summary.numInstances, 4)
+ self.assertEqual(summary.objectiveHistory, [0.0])
+ self.assertTrue(
+ np.allclose(
+ summary.coefficientStandardErrors,
+ [1.2859821149611763, 0.6248749874975031, 3.1645497310044184],
+ atol=1e-4,
+ )
)
- )
- self.assertTrue(
- np.allclose(
- summary.devianceResiduals, [-0.7424621202458727, 0.7875000000000003], atol=1e-4
+ self.assertTrue(
+ np.allclose(
+ summary.devianceResiduals, [-0.7424621202458727, 0.7875000000000003], atol=1e-4
+ )
)
- )
- self.assertTrue(
- np.allclose(
- summary.pValues,
- [0.7020630236843428, 0.8866003086182783, 0.9298746994547682],
- atol=1e-4,
+ self.assertTrue(
+ np.allclose(
+ summary.pValues,
+ [0.7020630236843428, 0.8866003086182783, 0.9298746994547682],
+ atol=1e-4,
+ )
)
- )
- self.assertTrue(
- np.allclose(
- summary.tValues,
- [0.5054502643838291, 0.1800360108036021, -0.11060025272186746],
- atol=1e-4,
+ self.assertTrue(
+ np.allclose(
+ summary.tValues,
+ [0.5054502643838291, 0.1800360108036021, -0.11060025272186746],
+ atol=1e-4,
+ )
)
- )
- self.assertTrue(np.allclose(summary.explainedVariance, 0.07997500000000031, atol=1e-4))
- self.assertTrue(np.allclose(summary.meanAbsoluteError, 0.4200000000000002, atol=1e-4))
- self.assertTrue(np.allclose(summary.meanSquaredError, 0.20212500000000005, atol=1e-4))
- self.assertTrue(np.allclose(summary.rootMeanSquaredError, 0.44958314025327956, atol=1e-4))
- self.assertTrue(np.allclose(summary.r2, 0.4427212572373862, atol=1e-4))
- self.assertTrue(np.allclose(summary.r2adj, -0.6718362282878414, atol=1e-4))
+ self.assertTrue(np.allclose(summary.explainedVariance, 0.07997500000000031, atol=1e-4))
+ self.assertTrue(np.allclose(summary.meanAbsoluteError, 0.4200000000000002, atol=1e-4))
+ self.assertTrue(np.allclose(summary.meanSquaredError, 0.20212500000000005, atol=1e-4))
+ self.assertTrue(
+ np.allclose(summary.rootMeanSquaredError, 0.44958314025327956, atol=1e-4)
+ )
+ self.assertTrue(np.allclose(summary.r2, 0.4427212572373862, atol=1e-4))
+ self.assertTrue(np.allclose(summary.r2adj, -0.6718362282878414, atol=1e-4))
+
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
summary2 = model.evaluate(df)
self.assertTrue(isinstance(summary2, LinearRegressionSummary))
@@ -318,36 +327,43 @@ def test_generalized_linear_regression(self):
self.assertEqual(output.columns, expected_cols)
self.assertEqual(output.count(), 4)
- # Model summary
- self.assertTrue(model.hasSummary)
-
- summary = model.summary
- self.assertIsInstance(summary, GeneralizedLinearRegressionSummary)
- self.assertIsInstance(summary, GeneralizedLinearRegressionTrainingSummary)
- self.assertEqual(summary.numIterations, 1)
- self.assertEqual(summary.numInstances, 4)
- self.assertEqual(summary.rank, 3)
- self.assertTrue(
- np.allclose(
+ def check_summary():
+ # Model summary
+ self.assertTrue(model.hasSummary)
+
+ summary = model.summary
+ self.assertIsInstance(summary, GeneralizedLinearRegressionSummary)
+ self.assertIsInstance(summary, GeneralizedLinearRegressionTrainingSummary)
+ self.assertEqual(summary.numIterations, 1)
+ self.assertEqual(summary.numInstances, 4)
+ self.assertEqual(summary.rank, 3)
+ self.assertTrue(
+ np.allclose(
+ summary.tValues,
+ [0.3725037662281711, -0.49418209022924164, 2.6589353685797654],
+ atol=1e-4,
+ ),
summary.tValues,
- [0.3725037662281711, -0.49418209022924164, 2.6589353685797654],
- atol=1e-4,
- ),
- summary.tValues,
- )
- self.assertTrue(
- np.allclose(
+ )
+ self.assertTrue(
+ np.allclose(
+ summary.pValues,
+ [0.7729938686180984, 0.707802691825973, 0.22900885781807023],
+ atol=1e-4,
+ ),
summary.pValues,
- [0.7729938686180984, 0.707802691825973, 0.22900885781807023],
- atol=1e-4,
- ),
- summary.pValues,
- )
- self.assertEqual(summary.predictions.columns, expected_cols)
- self.assertEqual(summary.predictions.count(), 4)
- self.assertEqual(summary.residuals().columns, ["devianceResiduals"])
- self.assertEqual(summary.residuals().count(), 4)
+ )
+ self.assertEqual(summary.predictions.columns, expected_cols)
+ self.assertEqual(summary.predictions.count(), 4)
+ self.assertEqual(summary.residuals().columns, ["devianceResiduals"])
+ self.assertEqual(summary.residuals().count(), 4)
+ check_summary()
+ if is_remote():
+ self.spark.client._delete_ml_cache([model._java_obj._ref_id], evict_only=True)
+ check_summary()
+
+ summary = model.summary
summary2 = model.evaluate(df)
self.assertIsInstance(summary2, GeneralizedLinearRegressionSummary)
self.assertNotIsInstance(summary2, GeneralizedLinearRegressionTrainingSummary)
diff --git a/python/pyspark/ml/util.py b/python/pyspark/ml/util.py
index b86178a97c382..9072e88ca29fb 100644
--- a/python/pyspark/ml/util.py
+++ b/python/pyspark/ml/util.py
@@ -72,20 +72,6 @@
_logger = logging.getLogger("pyspark.ml.util")
-def try_remote_intermediate_result(f: FuncT) -> FuncT:
- """Mark the function/property that returns the intermediate result of the remote call.
- Eg, model.summary"""
-
- @functools.wraps(f)
- def wrapped(self: "JavaWrapper") -> Any:
- if is_remote() and "PYSPARK_NO_NAMESPACE_SHARE" not in os.environ:
- return f"{str(self._java_obj)}.{f.__name__}"
- else:
- return f(self)
-
- return cast(FuncT, wrapped)
-
-
def invoke_helper_attr(method: str, *args: Any) -> Any:
from pyspark.ml.wrapper import JavaWrapper
@@ -125,7 +111,12 @@ def invoke_remote_attribute_relation(
object_id = instance._java_obj # type: ignore
methods, obj_ref = _extract_id_methods(object_id)
methods.append(pb2.Fetch.Method(method=method, args=serialize(session.client, *args)))
- plan = AttributeRelation(obj_ref, methods)
+
+ if methods[0].method == "summary":
+ child = instance._summary_dataset._plan # type: ignore
+ else:
+ child = None
+ plan = AttributeRelation(obj_ref, methods, child=child)
# To delay the GC of the model, keep a reference to the source instance,
# might be a model or a summary.
@@ -204,6 +195,15 @@ def wrapped(self: "JavaEstimator", dataset: "ConnectDataFrame") -> Any:
_logger.warning(warning_msg)
remote_model_ref = RemoteModelRef(model_info.obj_ref.id)
model = self._create_model(remote_model_ref)
+ if isinstance(model, HasTrainingSummary):
+ summary_dataset = model._summary_dataset(dataset)
+
+ summary = model._summaryCls(f"{str(model._java_obj)}.summary") # type: ignore
+ summary._summary_dataset = summary_dataset
+ summary._remote_model_obj = model._java_obj # type: ignore
+ summary._remote_model_obj.add_ref()
+
+ model._summary = summary # type: ignore
if model.__class__.__name__ not in ["Bucketizer"]:
model._resetUid(self.uid)
return self._copyValues(model)
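In Connect mode the training summary is now wired up eagerly when fit() returns, instead of being fetched lazily by name. A simplified sketch of the client-side lifecycle, using the names that appear in this diff:

    # The summary object is addressed on the server as "<model ref>.summary".
    summary = model._summaryCls(f"{model._java_obj}.summary")
    summary._summary_dataset = model._summary_dataset(dataset)  # kept so the summary can be re-created
    summary._remote_model_obj = model._java_obj
    summary._remote_model_obj.add_ref()     # the summary pins the remote model ...
    model._summary = summary

    # ... and releases it when the summary object is garbage collected
    # (see the try_remote_del change below: self._remote_model_obj.release_ref()).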
@@ -279,42 +279,69 @@ def try_remote_call(f: FuncT) -> FuncT:
@functools.wraps(f)
def wrapped(self: "JavaWrapper", name: str, *args: Any) -> Any:
if is_remote() and "PYSPARK_NO_NAMESPACE_SHARE" not in os.environ:
- # Launch a remote call if possible
+ from pyspark.errors.exceptions.connect import SparkException
import pyspark.sql.connect.proto as pb2
from pyspark.sql.connect.session import SparkSession
- from pyspark.ml.connect.util import _extract_id_methods
- from pyspark.ml.connect.serialize import serialize, deserialize
- from pyspark.ml.wrapper import JavaModel
session = SparkSession.getActiveSession()
- assert session is not None
- if self._java_obj == ML_CONNECT_HELPER_ID:
- obj_id = ML_CONNECT_HELPER_ID
- else:
- if isinstance(self, JavaModel):
- assert isinstance(self._java_obj, RemoteModelRef)
- obj_id = self._java_obj.ref_id
+
+ def remote_call() -> Any:
+ from pyspark.ml.connect.util import _extract_id_methods
+ from pyspark.ml.connect.serialize import serialize, deserialize
+ from pyspark.ml.wrapper import JavaModel
+
+ assert session is not None
+ if self._java_obj == ML_CONNECT_HELPER_ID:
+ obj_id = ML_CONNECT_HELPER_ID
else:
- # model summary
- obj_id = self._java_obj # type: ignore
- methods, obj_ref = _extract_id_methods(obj_id)
- methods.append(pb2.Fetch.Method(method=name, args=serialize(session.client, *args)))
- command = pb2.Command()
- command.ml_command.fetch.CopyFrom(
- pb2.Fetch(obj_ref=pb2.ObjectRef(id=obj_ref), methods=methods)
- )
- (_, properties, _) = session.client.execute_command(command)
- ml_command_result = properties["ml_command_result"]
- if ml_command_result.HasField("summary"):
- summary = ml_command_result.summary
- return summary
- elif ml_command_result.HasField("operator_info"):
- model_info = deserialize(properties)
- # get a new model ref id from the existing model,
- # it is up to the caller to build the model
- return model_info.obj_ref.id
- else:
- return deserialize(properties)
+ if isinstance(self, JavaModel):
+ assert isinstance(self._java_obj, RemoteModelRef)
+ obj_id = self._java_obj.ref_id
+ else:
+ # model summary
+ obj_id = self._java_obj # type: ignore
+ methods, obj_ref = _extract_id_methods(obj_id)
+ methods.append(pb2.Fetch.Method(method=name, args=serialize(session.client, *args)))
+ command = pb2.Command()
+ command.ml_command.fetch.CopyFrom(
+ pb2.Fetch(obj_ref=pb2.ObjectRef(id=obj_ref), methods=methods)
+ )
+ (_, properties, _) = session.client.execute_command(command)
+ ml_command_result = properties["ml_command_result"]
+ if ml_command_result.HasField("summary"):
+ summary = ml_command_result.summary
+ return summary
+ elif ml_command_result.HasField("operator_info"):
+ model_info = deserialize(properties)
+ # get a new model ref id from the existing model,
+ # it is up to the caller to build the model
+ return model_info.obj_ref.id
+ else:
+ return deserialize(properties)
+
+ try:
+ return remote_call()
+ except SparkException as e:
+ if e.getErrorClass() == "CONNECT_ML.MODEL_SUMMARY_LOST":
+ # the model summary is lost because the remote model was offloaded,
+ # send request to restore model.summary
+ create_summary_command = pb2.Command()
+ create_summary_command.ml_command.create_summary.CopyFrom(
+ pb2.MlCommand.CreateSummary(
+ model_ref=pb2.ObjectRef(
+ id=self._remote_model_obj.ref_id # type: ignore
+ ),
+ dataset=self._summary_dataset._plan.plan( # type: ignore
+ session.client # type: ignore
+ ),
+ )
+ )
+ session.client.execute_command(create_summary_command) # type: ignore
+
+ return remote_call()
+
+ # for other unexpected error, re-raise it.
+ raise
else:
return f(self, name, *args)
@@ -346,8 +373,11 @@ def wrapped(self: "JavaWrapper") -> Any:
except Exception:
return
- if in_remote and isinstance(self._java_obj, RemoteModelRef):
- self._java_obj.release_ref()
+ if in_remote:
+ if isinstance(self._java_obj, RemoteModelRef):
+ self._java_obj.release_ref()
+ if hasattr(self, "_remote_model_obj"):
+ self._remote_model_obj.release_ref()
return
else:
return f(self)
@@ -1076,17 +1106,32 @@ def hasSummary(self) -> bool:
Indicates whether a training summary exists for this model
instance.
"""
+ if is_remote() and "PYSPARK_NO_NAMESPACE_SHARE" not in os.environ:
+ return hasattr(self, "_summary")
return cast("JavaWrapper", self)._call_java("hasSummary")
@property
@since("2.1.0")
- @try_remote_intermediate_result
def summary(self) -> T:
"""
Gets summary of the model trained on the training set. An exception is thrown if
no summary exists.
"""
- return cast("JavaWrapper", self)._call_java("summary")
+ if is_remote() and "PYSPARK_NO_NAMESPACE_SHARE" not in os.environ:
+ if hasattr(self, "_summary"):
+ return self._summary
+ else:
+ raise RuntimeError(
+ "No training summary available for this %s" % self.__class__.__name__
+ )
+ return self._summaryCls(cast("JavaWrapper", self)._call_java("summary"))
+
+ @property
+ def _summaryCls(self) -> type:
+ raise NotImplementedError()
+
+ def _summary_dataset(self, train_dataset: "DataFrame") -> "DataFrame":
+ return self.transform(train_dataset) # type: ignore
class MetaAlgorithmReadWrite:
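Concrete model classes are expected to supply _summaryCls, and may override _summary_dataset when the summary is not backed by the plain transformed training data. An illustrative sketch with hypothetical names:

    class MyModel(JavaModel, HasTrainingSummary):
        @property
        def _summaryCls(self) -> type:
            # Wraps either the Java summary object (classic) or the
            # "<model ref>.summary" handle (Spark Connect).
            return MyTrainingSummary

        def _summary_dataset(self, train_dataset: "DataFrame") -> "DataFrame":
            # Default shown above: summaries are computed over the transformed training data.
            return self.transform(train_dataset)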
diff --git a/python/pyspark/pandas/base.py b/python/pyspark/pandas/base.py
index 01e23214d662d..a16a8902f9f06 100644
--- a/python/pyspark/pandas/base.py
+++ b/python/pyspark/pandas/base.py
@@ -42,6 +42,7 @@
from pyspark.pandas.spark.accessors import SparkIndexOpsMethods
from pyspark.pandas.typedef import extension_dtypes
from pyspark.pandas.utils import (
+ ansi_mode_context,
combine_frames,
same_anchor,
scol_for,
@@ -269,6 +270,14 @@ def wrapper(self: SeriesOrIndex, *args: Any) -> SeriesOrIndex:
return wrapper
+def _exclude_pd_np_operand(other: Any) -> None:
+ if isinstance(other, (pd.Series, pd.Index, pd.DataFrame, np.ndarray)):
+ raise TypeError(
+ f"Operand of type {type(other).__module__}.{type(other).__qualname__} "
+ f"is not supported for this operation. "
+ )
+
+
class IndexOpsMixin(object, metaclass=ABCMeta):
"""common ops mixin to support a unified interface / docs for Series / Index
@@ -313,16 +322,20 @@ def copy(self: IndexOpsLike) -> IndexOpsLike:
# arithmetic operators
def __neg__(self: IndexOpsLike) -> IndexOpsLike:
- return self._dtype_op.neg(self)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.neg(self)
def __add__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.add(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.add(self, other)
def __sub__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.sub(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.sub(self, other)
def __mul__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.mul(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.mul(self, other)
def __truediv__(self, other: Any) -> SeriesOrIndex:
"""
@@ -342,22 +355,28 @@ def __truediv__(self, other: Any) -> SeriesOrIndex:
| -10 | null | -np.inf |
+-----------------------|---------|---------+
"""
- return self._dtype_op.truediv(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.truediv(self, other)
def __mod__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.mod(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.mod(self, other)
def __radd__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.radd(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.radd(self, other)
def __rsub__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rsub(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rsub(self, other)
def __rmul__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rmul(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rmul(self, other)
def __rtruediv__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rtruediv(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rtruediv(self, other)
def __floordiv__(self, other: Any) -> SeriesOrIndex:
"""
@@ -377,68 +396,93 @@ def __floordiv__(self, other: Any) -> SeriesOrIndex:
| -10 | null | -np.inf |
+-----------------------|---------|---------+
"""
- return self._dtype_op.floordiv(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.floordiv(self, other)
def __rfloordiv__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rfloordiv(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rfloordiv(self, other)
def __rmod__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rmod(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rmod(self, other)
def __pow__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.pow(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.pow(self, other)
def __rpow__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rpow(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rpow(self, other)
def __abs__(self: IndexOpsLike) -> IndexOpsLike:
- return self._dtype_op.abs(self)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.abs(self)
# comparison operators
def __eq__(self, other: Any) -> SeriesOrIndex: # type: ignore[override]
# pandas always returns False for all items with dict and set.
- if isinstance(other, (dict, set)):
- return self != self
- else:
- return self._dtype_op.eq(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ _exclude_pd_np_operand(other)
+ if isinstance(other, (dict, set)):
+ return self != self
+ else:
+ return self._dtype_op.eq(self, other)
def __ne__(self, other: Any) -> SeriesOrIndex: # type: ignore[override]
- return self._dtype_op.ne(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ _exclude_pd_np_operand(other)
+ return self._dtype_op.ne(self, other)
def __lt__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.lt(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ _exclude_pd_np_operand(other)
+ return self._dtype_op.lt(self, other)
def __le__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.le(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ _exclude_pd_np_operand(other)
+ return self._dtype_op.le(self, other)
def __ge__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.ge(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ _exclude_pd_np_operand(other)
+ return self._dtype_op.ge(self, other)
def __gt__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.gt(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ _exclude_pd_np_operand(other)
+ return self._dtype_op.gt(self, other)
def __invert__(self: IndexOpsLike) -> IndexOpsLike:
- return self._dtype_op.invert(self)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.invert(self)
# `and`, `or`, `not` cannot be overloaded in Python,
# so use bitwise operators as boolean operators
def __and__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.__and__(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.__and__(self, other)
def __or__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.__or__(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.__or__(self, other)
def __rand__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rand(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rand(self, other)
def __ror__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.ror(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.ror(self, other)
def __xor__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.xor(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.xor(self, other)
def __rxor__(self, other: Any) -> SeriesOrIndex:
- return self._dtype_op.rxor(self, other)
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return self._dtype_op.rxor(self, other)
def __len__(self) -> int:
return len(self._psdf)
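Every Series/Index operator now executes inside ansi_mode_context(...), and the comparison operators reject raw pandas/NumPy operands up front via _exclude_pd_np_operand instead of surfacing an obscure Spark error later. Roughly what a user sees (illustrative):

    import pandas as pd
    import pyspark.pandas as ps

    psser = ps.Series([1, 2, 3])

    psser + 1            # arithmetic is evaluated under ansi_mode_context(...)
    psser == [1, 2, 3]   # plain lists and tuples are still accepted

    try:
        psser == pd.Series([1, 2, 3])    # pd.Series/pd.Index/pd.DataFrame/np.ndarray
    except TypeError as e:               # operands are rejected explicitly
        print(e)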
diff --git a/python/pyspark/pandas/config.py b/python/pyspark/pandas/config.py
index 290bee4340c0a..e89bcf835f8bd 100644
--- a/python/pyspark/pandas/config.py
+++ b/python/pyspark/pandas/config.py
@@ -24,7 +24,7 @@
from pyspark._globals import _NoValue, _NoValueType
from pyspark.sql.session import SparkSession
-from pyspark.pandas.utils import default_session, is_testing
+from pyspark.pandas.utils import default_session
__all__ = ["get_option", "set_option", "reset_option", "options", "option_context"]
@@ -287,7 +287,7 @@ def validate(self, v: Any) -> None:
"If False, pandas API on Spark may hit unexpected results or errors. "
"The default is False."
),
- default=is_testing(),
+ default=True,
types=bool,
),
Option(
diff --git a/python/pyspark/pandas/correlation.py b/python/pyspark/pandas/correlation.py
index da51dc2cc6126..9327b5eb71a45 100644
--- a/python/pyspark/pandas/correlation.py
+++ b/python/pyspark/pandas/correlation.py
@@ -19,7 +19,7 @@
from pyspark.sql import DataFrame as SparkDataFrame, functions as F
from pyspark.sql.window import Window
-from pyspark.pandas.utils import verify_temp_column_name
+from pyspark.pandas.utils import verify_temp_column_name, is_ansi_mode_enabled
CORRELATION_VALUE_1_COLUMN = "__correlation_value_1_input__"
@@ -60,6 +60,7 @@ def compute(sdf: SparkDataFrame, groupKeys: List[str], method: str) -> SparkData
.alias(CORRELATION_VALUE_2_COLUMN),
],
)
+ spark_session = sdf.sparkSession
if method in ["pearson", "spearman"]:
# convert values to avg ranks for spearman correlation
@@ -125,16 +126,20 @@ def compute(sdf: SparkDataFrame, groupKeys: List[str], method: str) -> SparkData
)
)
+ if is_ansi_mode_enabled(spark_session):
+ corr_expr = F.try_divide(
+ F.covar_samp(CORRELATION_VALUE_1_COLUMN, CORRELATION_VALUE_2_COLUMN),
+ F.stddev_samp(CORRELATION_VALUE_1_COLUMN)
+ * F.stddev_samp(CORRELATION_VALUE_2_COLUMN),
+ )
+ else:
+ corr_expr = F.corr(CORRELATION_VALUE_1_COLUMN, CORRELATION_VALUE_2_COLUMN)
+
sdf = sdf.groupby(groupKeys).agg(
- F.corr(CORRELATION_VALUE_1_COLUMN, CORRELATION_VALUE_2_COLUMN).alias(
- CORRELATION_CORR_OUTPUT_COLUMN
+ corr_expr.alias(CORRELATION_CORR_OUTPUT_COLUMN),
+ F.count(F.when(~F.isnull(CORRELATION_VALUE_1_COLUMN), 1)).alias(
+ CORRELATION_COUNT_OUTPUT_COLUMN
),
- F.count(
- F.when(
- ~F.isnull(CORRELATION_VALUE_1_COLUMN),
- 1,
- )
- ).alias(CORRELATION_COUNT_OUTPUT_COLUMN),
)
return sdf
@@ -219,6 +224,42 @@ def compute(sdf: SparkDataFrame, groupKeys: List[str], method: str) -> SparkData
F.col(CORRELATION_VALUE_2_COLUMN) == F.col(CORRELATION_VALUE_Y_COLUMN)
)
+ if is_ansi_mode_enabled(spark_session):
+ corr_expr = F.try_divide(
+ F.col(CORRELATION_KENDALL_P_COLUMN) - F.col(CORRELATION_KENDALL_Q_COLUMN),
+ F.sqrt(
+ (
+ F.col(CORRELATION_KENDALL_P_COLUMN)
+ + F.col(CORRELATION_KENDALL_Q_COLUMN)
+ + F.col(CORRELATION_KENDALL_T_COLUMN)
+ )
+ * (
+ F.col(CORRELATION_KENDALL_P_COLUMN)
+ + F.col(CORRELATION_KENDALL_Q_COLUMN)
+ + F.col(CORRELATION_KENDALL_U_COLUMN)
+ )
+ ),
+ )
+ else:
+ corr_expr = (
+ F.col(CORRELATION_KENDALL_P_COLUMN) - F.col(CORRELATION_KENDALL_Q_COLUMN)
+ ) / F.sqrt(
+ (
+ (
+ F.col(CORRELATION_KENDALL_P_COLUMN)
+ + F.col(CORRELATION_KENDALL_Q_COLUMN)
+ + (F.col(CORRELATION_KENDALL_T_COLUMN))
+ )
+ )
+ * (
+ (
+ F.col(CORRELATION_KENDALL_P_COLUMN)
+ + F.col(CORRELATION_KENDALL_Q_COLUMN)
+ + (F.col(CORRELATION_KENDALL_U_COLUMN))
+ )
+ )
+ )
+
sdf = (
sdf.groupby(groupKeys)
.agg(
@@ -232,26 +273,7 @@ def compute(sdf: SparkDataFrame, groupKeys: List[str], method: str) -> SparkData
).otherwise(F.lit(0))
).alias(CORRELATION_COUNT_OUTPUT_COLUMN),
)
- .withColumn(
- CORRELATION_CORR_OUTPUT_COLUMN,
- (F.col(CORRELATION_KENDALL_P_COLUMN) - F.col(CORRELATION_KENDALL_Q_COLUMN))
- / F.sqrt(
- (
- (
- F.col(CORRELATION_KENDALL_P_COLUMN)
- + F.col(CORRELATION_KENDALL_Q_COLUMN)
- + (F.col(CORRELATION_KENDALL_T_COLUMN))
- )
- )
- * (
- (
- F.col(CORRELATION_KENDALL_P_COLUMN)
- + F.col(CORRELATION_KENDALL_Q_COLUMN)
- + (F.col(CORRELATION_KENDALL_U_COLUMN))
- )
- )
- ),
- )
+ .withColumn(CORRELATION_CORR_OUTPUT_COLUMN, corr_expr)
)
sdf = sdf.select(
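Under ANSI mode the correlation kernels avoid raw division: Pearson is computed as covar_samp(x, y) / (stddev_samp(x) * stddev_samp(y)) via F.try_divide, and Kendall's tau-b, (P - Q) / sqrt((P + Q + T) * (P + Q + U)), goes through try_divide as well, so a zero denominator yields NULL instead of a divide-by-zero error. A minimal sketch of the Pearson form, assuming a DataFrame `sdf` with columns "x" and "y":

    from pyspark.sql import functions as F

    pearson = F.try_divide(
        F.covar_samp("x", "y"),
        F.stddev_samp("x") * F.stddev_samp("y"),
    ).alias("corr")

    sdf.agg(pearson)   # NULL rather than an ANSI error when either column has zero variance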
diff --git a/python/pyspark/pandas/data_type_ops/base.py b/python/pyspark/pandas/data_type_ops/base.py
index b4a6b1abbcaf9..bb2ef8b09aead 100644
--- a/python/pyspark/pandas/data_type_ops/base.py
+++ b/python/pyspark/pandas/data_type_ops/base.py
@@ -23,6 +23,7 @@
import numpy as np
import pandas as pd
from pandas.api.types import CategoricalDtype
+from pandas.core.dtypes.common import is_numeric_dtype
from pyspark.sql import functions as F, Column as PySparkColumn
from pyspark.sql.types import (
@@ -52,6 +53,7 @@
extension_object_dtypes_available,
spark_type_to_pandas_dtype,
)
+from pyspark.pandas.utils import is_ansi_mode_enabled
if extension_dtypes_available:
from pandas import Int8Dtype, Int16Dtype, Int32Dtype, Int64Dtype
@@ -108,6 +110,33 @@ def transform_boolean_operand_to_numeric(
return operand
+def _should_return_all_false(left: IndexOpsLike, right: Any) -> bool:
+ """
+ Determine whether a binary comparison should short-circuit to all False because the
+ dtypes are incompatible: they differ and are not both numeric (bools count as numeric).
+ """
+ from pyspark.pandas.base import IndexOpsMixin
+ from pandas.api.types import is_list_like # type: ignore[attr-defined]
+
+ def are_both_numeric(left_dtype: Dtype, right_dtype: Dtype) -> bool:
+ return is_numeric_dtype(left_dtype) and is_numeric_dtype(right_dtype)
+
+ left_dtype = left.dtype
+
+ if isinstance(right, IndexOpsMixin):
+ right_dtype = right.dtype
+ elif isinstance(right, (list, tuple)):
+ right_dtype = pd.Series(right).dtype
+ else:
+ assert not is_list_like(right), (
+ "Only ps.Series, ps.Index, list, tuple, or scalar is supported as the "
+ "right-hand operand."
+ )
+ right_dtype = pd.Series([right]).dtype
+
+ return left_dtype != right_dtype and not are_both_numeric(left_dtype, right_dtype)
+
+
def _as_categorical_type(
index_ops: IndexOpsLike, dtype: CategoricalDtype, spark_type: DataType
) -> IndexOpsLike:
@@ -392,6 +421,10 @@ def ge(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
raise TypeError(">= can not be applied to %s." % self.pretty_name)
def eq(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
+ if is_ansi_mode_enabled(left._internal.spark_frame.sparkSession):
+ if _should_return_all_false(left, right):
+ return left._with_new_scol(F.lit(False)).rename(None) # type: ignore[attr-defined]
+
if isinstance(right, (list, tuple)):
from pyspark.pandas.series import first_series, scol_for
from pyspark.pandas.frame import DataFrame
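With this check, an ANSI-mode equality comparison between incompatible dtypes short-circuits to an all-False column, matching pandas, rather than letting Spark raise a cast error. Illustrative behavior:

    import pyspark.pandas as ps

    ps.Series(["a", "b", "c"]) == 1    # string vs. int  -> all False
    ps.Series([1, 2, 3]) == "x"        # numeric vs. str -> all False
    ps.Series([1, 2, 3]) == 1.0        # both numeric    -> ordinary element-wise comparison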
diff --git a/python/pyspark/pandas/data_type_ops/boolean_ops.py b/python/pyspark/pandas/data_type_ops/boolean_ops.py
index 765ec6a946347..d8fccb9d18847 100644
--- a/python/pyspark/pandas/data_type_ops/boolean_ops.py
+++ b/python/pyspark/pandas/data_type_ops/boolean_ops.py
@@ -19,9 +19,11 @@
from typing import Any, Union
import pandas as pd
-from pandas.api.types import CategoricalDtype
+from pandas.api.types import CategoricalDtype, is_integer_dtype # type: ignore[attr-defined]
+from pandas.core.dtypes.common import is_numeric_dtype
-from pyspark.pandas.base import column_op, IndexOpsMixin, numpy_column_op
+from pyspark.pandas.base import column_op, IndexOpsMixin
+from pyspark.pandas.config import get_option
from pyspark.pandas._typing import Dtype, IndexOpsLike, SeriesOrIndex
from pyspark.pandas.data_type_ops.base import (
DataTypeOps,
@@ -137,21 +139,13 @@ def mod(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
raise TypeError(
"Modulo can not be applied to %s and the given type." % self.pretty_name
)
- spark_session = left._internal.spark_frame.sparkSession
-
- def safe_mod(left_col: PySparkColumn, right_val: Any) -> PySparkColumn:
- if is_ansi_mode_enabled(spark_session):
- return F.when(F.lit(right_val == 0), F.lit(None)).otherwise(left_col % right_val)
- else:
- return left_col % right_val
-
if isinstance(right, numbers.Number):
left = transform_boolean_operand_to_numeric(left, spark_type=as_spark_type(type(right)))
- return numpy_column_op(safe_mod)(left, right)
+ return left % right
else:
assert isinstance(right, IndexOpsMixin)
left = transform_boolean_operand_to_numeric(left, spark_type=right.spark.data_type)
- return numpy_column_op(safe_mod)(left, right)
+ return left % right
def pow(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
@@ -235,18 +229,7 @@ def rmod(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if isinstance(right, numbers.Number) and not isinstance(right, bool):
left = transform_boolean_operand_to_numeric(left, spark_type=as_spark_type(type(right)))
- spark_session = left._internal.spark_frame.sparkSession
-
- if is_ansi_mode_enabled(spark_session):
-
- def safe_rmod(left_col: PySparkColumn, right_val: Any) -> PySparkColumn:
- return F.when(left_col != 0, F.pmod(F.lit(right_val), left_col)).otherwise(
- F.lit(None)
- )
-
- return numpy_column_op(safe_rmod)(left, right)
- else:
- return right % left
+ return right % left
else:
raise TypeError(
"Modulo can not be applied to %s and the given type." % self.pretty_name
@@ -339,6 +322,13 @@ def astype(self, index_ops: IndexOpsLike, dtype: Union[str, type, Dtype]) -> Ind
),
)
else:
+ is_ansi = is_ansi_mode_enabled(index_ops._internal.spark_frame.sparkSession)
+ if is_ansi and get_option("compute.eager_check"):
+ if is_integer_dtype(dtype) and not isinstance(dtype, extension_dtypes):
+ if index_ops.hasnans:
+ raise ValueError(
+ "Cannot convert %s with missing values to integer" % self.pretty_name
+ )
return _as_other_type(index_ops, dtype, spark_type)
def neg(self, operand: IndexOpsLike) -> IndexOpsLike:
@@ -347,6 +337,24 @@ def neg(self, operand: IndexOpsLike) -> IndexOpsLike:
def abs(self, operand: IndexOpsLike) -> IndexOpsLike:
return operand
+ def eq(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
+ if is_ansi_mode_enabled(left._internal.spark_frame.sparkSession):
+ # Handle bool vs. non-bool numeric comparisons
+ left_is_bool = _is_boolean_type(left)
+ right_is_non_bool_numeric = is_numeric_dtype(right) and not _is_boolean_type(right)
+
+ if left_is_bool and right_is_non_bool_numeric:
+ if isinstance(right, numbers.Number):
+ left = transform_boolean_operand_to_numeric(
+ left, spark_type=as_spark_type(type(right))
+ )
+ else:
+ left = transform_boolean_operand_to_numeric(
+ left, spark_type=right.spark.data_type
+ )
+
+ return super().eq(left, right)
+
def lt(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
return column_op(PySparkColumn.__lt__)(left, right)
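For boolean columns, the ANSI equality path first casts the boolean operand to the numeric operand's type, and astype to a non-extension integer dtype now fails fast when compute.eager_check is enabled and the column contains missing values. Illustrative, assuming ANSI mode:

    import pyspark.pandas as ps

    psser = ps.Series([True, False, True])
    psser == 1   # the boolean column is cast to the numeric operand's type before comparing

    # With compute.eager_check on, casting a boolean column that holds nulls to a plain
    # integer dtype raises ValueError("Cannot convert ... with missing values to integer")
    # up front instead of failing later inside Spark.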
diff --git a/python/pyspark/pandas/data_type_ops/num_ops.py b/python/pyspark/pandas/data_type_ops/num_ops.py
index 34d313af8232e..940eb0ef40af2 100644
--- a/python/pyspark/pandas/data_type_ops/num_ops.py
+++ b/python/pyspark/pandas/data_type_ops/num_ops.py
@@ -16,13 +16,15 @@
#
import numbers
-from typing import Any, Union
+from typing import Any, Union, Callable
import numpy as np
import pandas as pd
from pandas.api.types import ( # type: ignore[attr-defined]
is_bool_dtype,
is_integer_dtype,
+ is_float_dtype,
+ is_numeric_dtype,
CategoricalDtype,
is_list_like,
)
@@ -41,8 +43,9 @@
_sanitize_list_like,
_is_valid_for_logical_operator,
_is_boolean_type,
+ _should_return_all_false,
)
-from pyspark.pandas.typedef.typehints import extension_dtypes, pandas_on_spark_type
+from pyspark.pandas.typedef.typehints import extension_dtypes, pandas_on_spark_type, as_spark_type
from pyspark.pandas.utils import is_ansi_mode_enabled
from pyspark.sql import functions as F, Column as PySparkColumn
from pyspark.sql.types import (
@@ -69,6 +72,27 @@ def _non_fractional_astype(
return _as_other_type(index_ops, dtype, spark_type)
+def _cast_back_float(
+ expr: PySparkColumn, left_dtype: Union[str, type, Dtype], right: Any
+) -> PySparkColumn:
+ """
+ Cast the result expression back to the original float dtype if needed.
+
+ This function ensures pandas on Spark matches pandas behavior when performing
+ arithmetic operations involving float32 and numeric values. In such cases, under ANSI mode,
+ Spark implicitly widen float32 to float64, when the other operand is a numeric type
+ but not float32 (e.g., int, bool), which deviates from pandas behavior where the result
+ retains float32.
+ """
+ is_left_float = is_float_dtype(left_dtype)
+ is_right_numeric = isinstance(right, (int, float, bool)) or (
+ hasattr(right, "dtype") and is_numeric_dtype(right.dtype)
+ )
+ if is_left_float and is_right_numeric:
+ return expr.cast(as_spark_type(left_dtype))
+ return expr
+
+
class NumericOps(DataTypeOps):
"""The class for binary operations of numeric pandas-on-Spark objects."""
@@ -80,28 +104,51 @@ def add(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("Addition can not be applied to given types.")
+ spark_session = left._internal.spark_frame.sparkSession
+ new_right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- return column_op(PySparkColumn.__add__)(left, right)
+ def wrapped_add(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = PySparkColumn.__add__(lc, rc)
+ if is_ansi_mode_enabled(spark_session):
+ expr = _cast_back_float(expr, left.dtype, right)
+ return expr
+
+ return column_op(wrapped_add)(left, new_right)
def sub(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("Subtraction can not be applied to given types.")
+ spark_session = left._internal.spark_frame.sparkSession
+ new_right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- return column_op(PySparkColumn.__sub__)(left, right)
+ def wrapped_sub(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = PySparkColumn.__sub__(lc, rc)
+ if is_ansi_mode_enabled(spark_session):
+ expr = _cast_back_float(expr, left.dtype, right)
+ return expr
+
+ return column_op(wrapped_sub)(left, new_right)
def mod(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("Modulo can not be applied to given types.")
+ spark_session = left._internal.spark_frame.sparkSession
- def mod(left: PySparkColumn, right: Any) -> PySparkColumn:
- return ((left % right) + right) % right
+ def mod(left_op: PySparkColumn, right_op: Any) -> PySparkColumn:
+ if is_ansi_mode_enabled(spark_session):
+ expr = F.when(F.lit(right_op == 0), F.lit(None)).otherwise(
+ ((left_op % right_op) + right_op) % right_op
+ )
+ expr = _cast_back_float(expr, left.dtype, right)
+ else:
+ expr = ((left_op % right_op) + right_op) % right_op
+ return expr
- right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- return column_op(mod)(left, right)
+ new_right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
+
+ return column_op(mod)(left, new_right)
def pow(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
@@ -122,22 +169,46 @@ def radd(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not isinstance(right, numbers.Number):
raise TypeError("Addition can not be applied to given types.")
- right = transform_boolean_operand_to_numeric(right)
- return column_op(PySparkColumn.__radd__)(left, right)
+ spark_session = left._internal.spark_frame.sparkSession
+ new_right = transform_boolean_operand_to_numeric(right)
+
+ def wrapped_radd(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = PySparkColumn.__radd__(lc, rc)
+ if is_ansi_mode_enabled(spark_session):
+ expr = _cast_back_float(expr, left.dtype, right)
+ return expr
+
+ return column_op(wrapped_radd)(left, new_right)
def rsub(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not isinstance(right, numbers.Number):
raise TypeError("Subtraction can not be applied to given types.")
- right = transform_boolean_operand_to_numeric(right)
- return column_op(PySparkColumn.__rsub__)(left, right)
+ spark_session = left._internal.spark_frame.sparkSession
+ new_right = transform_boolean_operand_to_numeric(right)
+
+ def wrapped_rsub(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = PySparkColumn.__rsub__(lc, rc)
+ if is_ansi_mode_enabled(spark_session):
+ expr = _cast_back_float(expr, left.dtype, right)
+ return expr
+
+ return column_op(wrapped_rsub)(left, new_right)
def rmul(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not isinstance(right, numbers.Number):
raise TypeError("Multiplication can not be applied to given types.")
- right = transform_boolean_operand_to_numeric(right)
- return column_op(PySparkColumn.__rmul__)(left, right)
+ spark_session = left._internal.spark_frame.sparkSession
+ new_right = transform_boolean_operand_to_numeric(right)
+
+ def wrapped_rmul(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = PySparkColumn.__mul__(lc, rc)
+ if is_ansi_mode_enabled(spark_session):
+ expr = _cast_back_float(expr, left.dtype, right)
+ return expr
+
+ return column_op(wrapped_rmul)(left, new_right)
def rpow(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
@@ -154,12 +225,22 @@ def rmod(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not isinstance(right, numbers.Number):
raise TypeError("Modulo can not be applied to given types.")
+ spark_session = left._internal.spark_frame.sparkSession
- def rmod(left: PySparkColumn, right: Any) -> PySparkColumn:
- return ((right % left) + left) % left
+ new_right = transform_boolean_operand_to_numeric(right)
- right = transform_boolean_operand_to_numeric(right)
- return column_op(rmod)(left, right)
+ def safe_rmod(left_op: PySparkColumn, right_op: Any) -> PySparkColumn:
+ if is_ansi_mode_enabled(spark_session):
+ # Java-style modulo -> Python-style modulo
+ result = F.when(
+ left_op != 0, ((F.lit(right_op) % left_op) + left_op) % left_op
+ ).otherwise(F.lit(None))
+ result = _cast_back_float(result, left.dtype, right)
+ return result
+ else:
+ return ((right_op % left_op) + left_op) % left_op
+
+ return column_op(safe_rmod)(left, new_right)
def neg(self, operand: IndexOpsLike) -> IndexOpsLike:
return operand._with_new_scol(-operand.spark.column, field=operand._internal.data_fields[0])
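Python-style modulo is derived from Spark's remainder as ((a % b) + b) % b; under ANSI mode the zero-divisor case is guarded explicitly so it yields NULL (surfaced as NaN, like pandas) rather than raising. A sketch of the guarded expression for a scalar divisor, mirroring the code above:

    from pyspark.sql import functions as F

    def python_mod(left_col, right_val):
        # Java-style remainder -> Python/pandas semantics; NULL when the divisor is zero
        return F.when(F.lit(right_val == 0), F.lit(None)).otherwise(
            ((left_col % right_val) + right_val) % right_val
        )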
@@ -173,7 +254,16 @@ def eq(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
# We can directly use `super().eq` when given object is list, tuple, dict or set.
if not isinstance(right, IndexOpsMixin) and is_list_like(right):
return super().eq(left, right)
- return pyspark_column_op("__eq__", left, right, fillna=False)
+ else:
+ if is_ansi_mode_enabled(left._internal.spark_frame.sparkSession):
+ if _should_return_all_false(left, right):
+ left_scol = left._with_new_scol(F.lit(False))
+ return left_scol.rename(None) # type: ignore[attr-defined]
+ if _is_boolean_type(right): # numeric vs. bool
+ right = transform_boolean_operand_to_numeric(
+ right, spark_type=left.spark.data_type
+ )
+ return pyspark_column_op("__eq__", left, right, fillna=False)
def ne(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
@@ -271,13 +361,22 @@ def floordiv(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("Floor division can not be applied to given types.")
+ spark_session = left._internal.spark_frame.sparkSession
+ use_try_divide = is_ansi_mode_enabled(spark_session)
+
+ def fallback_div(x: PySparkColumn, y: PySparkColumn) -> PySparkColumn:
+ return x.__div__(y)
+
+ safe_div: Callable[[PySparkColumn, PySparkColumn], PySparkColumn] = (
+ F.try_divide if use_try_divide else fallback_div
+ )
def floordiv(left: PySparkColumn, right: Any) -> PySparkColumn:
return F.when(F.lit(right is np.nan), np.nan).otherwise(
F.when(
F.lit(right != 0) | F.lit(right).isNull(),
F.floor(left.__div__(right)),
- ).otherwise(F.lit(np.inf).__div__(left))
+ ).otherwise(safe_div(F.lit(np.inf), left))
)
right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
@@ -334,56 +433,76 @@ def mul(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("Multiplication can not be applied to given types.")
- right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
+ spark_session = left._internal.spark_frame.sparkSession
+ new_right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- return column_op(PySparkColumn.__mul__)(left, right)
+ def wrapped_mul(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = PySparkColumn.__mul__(lc, rc)
+ if is_ansi_mode_enabled(spark_session):
+ expr = _cast_back_float(expr, left.dtype, right)
+ return expr
+
+ return column_op(wrapped_mul)(left, new_right)
def truediv(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("True division can not be applied to given types.")
spark_session = left._internal.spark_frame.sparkSession
- right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
+ new_right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
+ left_dtype = left.dtype
- def truediv(left: PySparkColumn, right: Any) -> PySparkColumn:
+ def truediv(lc: PySparkColumn, rc: Any) -> PySparkColumn:
if is_ansi_mode_enabled(spark_session):
- return F.when(
- F.lit(right == 0),
- F.when(left < 0, F.lit(float("-inf")))
- .when(left > 0, F.lit(float("inf")))
+ expr = F.when(
+ F.lit(rc == 0),
+ F.when(lc < 0, F.lit(float("-inf")))
+ .when(lc > 0, F.lit(float("inf")))
.otherwise(F.lit(np.nan)),
- ).otherwise(left / right)
+ ).otherwise(lc / rc)
else:
- return F.when(
- F.lit(right != 0) | F.lit(right).isNull(),
- left.__div__(right),
+ expr = F.when(
+ F.lit(rc != 0) | F.lit(rc).isNull(),
+ lc.__div__(rc),
).otherwise(
- F.when(F.lit(left == np.inf) | F.lit(left == -np.inf), left).otherwise(
- F.lit(np.inf).__div__(left)
+ F.when(F.lit(lc == np.inf) | F.lit(lc == -np.inf), lc).otherwise(
+ F.lit(np.inf).__div__(lc)
)
)
+ return _cast_back_float(expr, left_dtype, right)
- return numpy_column_op(truediv)(left, right)
+ return numpy_column_op(truediv)(left, new_right)
def floordiv(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
if not is_valid_operand_for_numeric_arithmetic(right):
raise TypeError("Floor division can not be applied to given types.")
+ spark_session = left._internal.spark_frame.sparkSession
+ use_try_divide = is_ansi_mode_enabled(spark_session)
+ left_dtype = left.dtype
- def floordiv(left: PySparkColumn, right: Any) -> PySparkColumn:
- return F.when(F.lit(right is np.nan), np.nan).otherwise(
+ def fallback_div(x: PySparkColumn, y: PySparkColumn) -> PySparkColumn:
+ return x.__div__(y)
+
+ safe_div: Callable[[PySparkColumn, PySparkColumn], PySparkColumn] = (
+ F.try_divide if use_try_divide else fallback_div
+ )
+
+ def floordiv(lc: PySparkColumn, rc: Any) -> PySparkColumn:
+ expr = F.when(F.lit(rc is np.nan), np.nan).otherwise(
F.when(
- F.lit(right != 0) | F.lit(right).isNull(),
- F.floor(left.__div__(right)),
+ F.lit(rc != 0) | F.lit(rc).isNull(),
+ F.floor(lc.__div__(rc)),
).otherwise(
- F.when(F.lit(left == np.inf) | F.lit(left == -np.inf), left).otherwise(
- F.lit(np.inf).__div__(left)
+ F.when(F.lit(lc == np.inf) | F.lit(lc == -np.inf), lc).otherwise(
+ safe_div(F.lit(np.inf), lc)
)
)
)
+ return _cast_back_float(expr, left_dtype, right)
- right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
- return numpy_column_op(floordiv)(left, right)
+ new_right = transform_boolean_operand_to_numeric(right, spark_type=left.spark.data_type)
+ return numpy_column_op(floordiv)(left, new_right)
def rtruediv(self, left: IndexOpsLike, right: Any) -> SeriesOrIndex:
_sanitize_list_like(right)
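Two ANSI-mode adjustments recur throughout these fractional ops: results are cast back to the original float dtype (so float32 combined with an int or bool stays float32, as in pandas, instead of being widened to float64), and the infinity edge cases use F.try_divide so dividing by a zero column yields NULL instead of an error. Illustrative:

    import numpy as np
    import pyspark.pandas as ps

    psser = ps.Series(np.array([1.0, 2.0, 4.0], dtype="float32"))
    (psser + 1).dtype    # stays float32 under ANSI mode thanks to _cast_back_float
    (psser // 2).dtype   # float32 as well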
diff --git a/python/pyspark/pandas/frame.py b/python/pyspark/pandas/frame.py
index a6f737d0d01bf..745551e8b8f9b 100644
--- a/python/pyspark/pandas/frame.py
+++ b/python/pyspark/pandas/frame.py
@@ -25,7 +25,7 @@
import inspect
import json
import types
-from functools import partial, reduce
+from functools import partial, reduce, wraps
import sys
from itertools import zip_longest, chain
from types import TracebackType
@@ -42,6 +42,7 @@
Sequence,
Tuple,
Type,
+ TypeVar,
Union,
cast,
no_type_check,
@@ -109,9 +110,11 @@
from pyspark.pandas.spark.accessors import SparkFrameMethods, CachedSparkFrameMethods
from pyspark.pandas.utils import (
align_diff_frames,
+ ansi_mode_context,
column_labels_level,
combine_frames,
default_session,
+ is_ansi_mode_enabled,
is_name_like_tuple,
is_name_like_value,
is_testing,
@@ -168,6 +171,18 @@
)
+FuncT = TypeVar("FuncT", bound=Callable[..., Any])
+
+
+def with_ansi_mode_context(f: FuncT) -> FuncT:
+ @wraps(f)
+ def _with_ansi_mode_context(self: "DataFrame", *args: Any, **kwargs: Any) -> Any:
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return f(self, *args, **kwargs)
+
+ return cast(FuncT, _with_ansi_mode_context)
+
+
_flex_doc_FRAME = """
Get {desc} of dataframe and other, element-wise (binary operator `{op_name}`).
@@ -739,6 +754,7 @@ def axes(self) -> List:
"""
return [self.index, self.columns]
+ @with_ansi_mode_context
def _reduce_for_stat_function(
self,
sfun: Callable[["Series"], PySparkColumn],
@@ -869,6 +885,7 @@ def _psser_for(self, label: Label) -> "Series":
"""
return self._pssers[label]
+ @with_ansi_mode_context
def _apply_series_op(
self,
op: Callable[["Series"], Union["Series", PySparkColumn]],
@@ -883,6 +900,7 @@ def _apply_series_op(
return DataFrame(internal)
# Arithmetic Operators
+ @with_ansi_mode_context
def _map_series_op(self, op: str, other: Any) -> "DataFrame":
from pyspark.pandas.base import IndexOpsMixin
@@ -1506,6 +1524,7 @@ def aggregate(self, func: Union[List[str], Dict[Name, List[str]]]) -> "DataFrame
agg = aggregate
+ @with_ansi_mode_context
def corr(self, method: str = "pearson", min_periods: Optional[int] = None) -> "DataFrame":
"""
Compute pairwise correlation of columns, excluding NA/null values.
@@ -1725,6 +1744,7 @@ def corr(self, method: str = "pearson", min_periods: Optional[int] = None) -> "D
)
)
+ @with_ansi_mode_context
def corrwith(
self, other: DataFrameOrSeries, axis: Axis = 0, drop: bool = False, method: str = "pearson"
) -> "Series":
@@ -8383,6 +8403,7 @@ def nsmallest(
by_scols = self._prepare_sort_by_scols(columns)
return self._sort(by=by_scols, ascending=True, na_position="last", keep=keep).head(n=n)
+ @with_ansi_mode_context
def isin(self, values: Union[List, Dict]) -> "DataFrame":
"""
Whether each element in the DataFrame is contained in values.
@@ -8456,7 +8477,13 @@ def isin(self, values: Union[List, Dict]) -> "DataFrame":
)
for label in self._internal.column_labels:
- scol = self._internal.spark_column_for(label).isin([F.lit(v) for v in values])
+ if is_ansi_mode_enabled(self._internal.spark_frame.sparkSession):
+ col_type = self._internal.spark_type_for(label)
+ scol = self._internal.spark_column_for(label).isin(
+ [F.lit(v).try_cast(col_type) for v in values]
+ )
+ else:
+ scol = self._internal.spark_column_for(label).isin([F.lit(v) for v in values])
scol = F.coalesce(scol, F.lit(False))
data_spark_columns.append(scol.alias(self._internal.spark_column_name_for(label)))
else:
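DataFrame.isin now try_casts each literal to the column's own type under ANSI mode, so a value of a mismatched type simply fails to match (the NULL from try_cast is coalesced to False) instead of triggering a cast error. Illustrative:

    import pyspark.pandas as ps

    psdf = ps.DataFrame({"a": [1, 2, 3], "b": ["x", "y", "z"]})
    psdf.isin([1, "x"])   # each literal is try_cast per column; type mismatches are just False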
@@ -10425,6 +10452,7 @@ def reindex_like(self, other: "DataFrame", copy: bool = True) -> "DataFrame":
else:
raise TypeError("other must be a pandas-on-Spark DataFrame")
+ @with_ansi_mode_context
def melt(
self,
id_vars: Optional[Union[Name, List[Name]]] = None,
@@ -10610,12 +10638,35 @@ def melt(
else:
var_name = [var_name] # type: ignore[list-item]
+ use_cast = is_ansi_mode_enabled(self._internal.spark_frame.sparkSession)
+ string_cast_required_type = None
+ if use_cast:
+ field_by_label = {
+ label: field
+ for label, field in zip(self._internal.column_labels, self._internal.data_fields)
+ }
+
+ value_col_types = [field_by_label[label].spark_type for label in value_vars]
+ # If any value column is of StringType, cast all value columns to StringType to
+ # avoid ANSI mode errors during explode when mixing strings and integers.
+ string_cast_required_type = (
+ StringType() if any(isinstance(t, StringType) for t in value_col_types) else None
+ )
+
pairs = F.explode(
F.array(
*[
F.struct(
*[F.lit(c).alias(name) for c, name in zip(label, var_name)],
- *[self._internal.spark_column_for(label).alias(value_name)],
+ *[
+ (
+ self._internal.spark_column_for(label).cast(
+ string_cast_required_type
+ )
+ if use_cast and string_cast_required_type is not None
+ else self._internal.spark_column_for(label)
+ ).alias(value_name)
+ ],
)
for label in column_labels
if label in value_vars
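melt explodes all value columns into a single column, which breaks under ANSI when string and numeric columns are mixed; the fix casts every value column to string whenever at least one of them is a string column. Illustrative:

    import pyspark.pandas as ps

    psdf = ps.DataFrame({"id": [1, 2], "name": ["a", "b"], "score": [10, 20]})
    psdf.melt(id_vars="id")   # "name" being a string column forces "score" into the string "value" column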
@@ -13778,32 +13829,12 @@ def _test() -> None:
import uuid
from pyspark.sql import SparkSession
import pyspark.pandas.frame
- from pyspark.testing.utils import is_ansi_mode_test
os.chdir(os.environ["SPARK_HOME"])
globs = pyspark.pandas.frame.__dict__.copy()
globs["ps"] = pyspark.pandas
- if is_ansi_mode_test:
- del pyspark.pandas.frame.DataFrame.add.__doc__
- del pyspark.pandas.frame.DataFrame.div.__doc__
- del pyspark.pandas.frame.DataFrame.floordiv.__doc__
- del pyspark.pandas.frame.DataFrame.melt.__doc__
- del pyspark.pandas.frame.DataFrame.mod.__doc__
- del pyspark.pandas.frame.DataFrame.mul.__doc__
- del pyspark.pandas.frame.DataFrame.pow.__doc__
- del pyspark.pandas.frame.DataFrame.radd.__doc__
- del pyspark.pandas.frame.DataFrame.rdiv.__doc__
- del pyspark.pandas.frame.DataFrame.rfloordiv.__doc__
- del pyspark.pandas.frame.DataFrame.rmod.__doc__
- del pyspark.pandas.frame.DataFrame.rmul.__doc__
- del pyspark.pandas.frame.DataFrame.rpow.__doc__
- del pyspark.pandas.frame.DataFrame.rsub.__doc__
- del pyspark.pandas.frame.DataFrame.rtruediv.__doc__
- del pyspark.pandas.frame.DataFrame.sub.__doc__
- del pyspark.pandas.frame.DataFrame.truediv.__doc__
-
spark = (
SparkSession.builder.master("local[4]").appName("pyspark.pandas.frame tests").getOrCreate()
)
diff --git a/python/pyspark/pandas/generic.py b/python/pyspark/pandas/generic.py
index 1244ee2d88aac..dd9cc311f2742 100644
--- a/python/pyspark/pandas/generic.py
+++ b/python/pyspark/pandas/generic.py
@@ -156,7 +156,7 @@ def cummin(self: FrameLike, skipna: bool = True) -> FrameLike:
Returns a DataFrame or Series of the same size containing the cumulative minimum.
.. note:: the current implementation of cummin uses Spark's Window without
- specifying partition specification. This leads to moveing all data into a
+ specifying partition specification. This leads to moving all data into a
single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -216,7 +216,7 @@ def cummax(self: FrameLike, skipna: bool = True) -> FrameLike:
Returns a DataFrame or Series of the same size containing the cumulative maximum.
.. note:: the current implementation of cummax uses Spark's Window without
- specifying partition specification. This leads to moveing all data into a
+ specifying partition specification. This leads to moving all data into a
single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -277,7 +277,7 @@ def cumsum(self: FrameLike, skipna: bool = True) -> FrameLike:
Returns a DataFrame or Series of the same size containing the cumulative sum.
.. note:: the current implementation of cumsum uses Spark's Window without
- specifying partition specification. This leads to moveing all data into a
+ specifying partition specification. This leads to moving all data into a
single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -338,7 +338,7 @@ def cumprod(self: FrameLike, skipna: bool = True) -> FrameLike:
Returns a DataFrame or Series of the same size containing the cumulative product.
.. note:: the current implementation of cumprod uses Spark's Window without
- specifying partition specification. This leads to moveing all data into a
+ specifying partition specification. This leads to moving all data into a
single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -3330,7 +3330,7 @@ def bfill(
Synonym for `DataFrame.fillna()` or `Series.fillna()` with ``method=`bfill```.
.. note:: the current implementation of 'bfill' uses Spark's Window
- without specifying partition specification. This leads to moveing all data into a
+ without specifying partition specification. This leads to moving all data into a
single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -3409,7 +3409,7 @@ def ffill(
Synonym for `DataFrame.fillna()` or `Series.fillna()` with ``method=`ffill```.
.. note:: the current implementation of 'ffill' uses Spark's Window
- without specifying partition specification. This leads to moveing all data into a
+ without specifying partition specification. This leads to moving all data into a
single a partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -3489,7 +3489,7 @@ def interpolate(
Fill NaN values using an interpolation method.
.. note:: the current implementation of interpolate uses Spark's Window without
- specifying partition specification. This leads to moveing all data into a
+ specifying partition specification. This leads to moving all data into a
single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
diff --git a/python/pyspark/pandas/groupby.py b/python/pyspark/pandas/groupby.py
index 93cbf6ff0a2c0..24a6dbe2e40f2 100644
--- a/python/pyspark/pandas/groupby.py
+++ b/python/pyspark/pandas/groupby.py
@@ -21,7 +21,7 @@
from abc import ABCMeta, abstractmethod
import inspect
from collections import defaultdict, namedtuple
-from functools import partial
+from functools import partial, wraps
from itertools import product
from typing import (
Any,
@@ -36,6 +36,7 @@
Set,
Tuple,
Type,
+ TypeVar,
Union,
cast,
TYPE_CHECKING,
@@ -85,6 +86,7 @@
)
from pyspark.pandas.utils import (
align_diff_frames,
+ ansi_mode_context,
is_name_like_tuple,
is_name_like_value,
name_like_string,
@@ -100,6 +102,18 @@
from pyspark.pandas.window import RollingGroupby, ExpandingGroupby, ExponentialMovingGroupby
+FuncT = TypeVar("FuncT", bound=Callable[..., Any])
+
+
+def with_ansi_mode_context(f: FuncT) -> FuncT:
+ @wraps(f)
+ def _with_ansi_mode_context(self: "GroupBy", *args: Any, **kwargs: Any) -> Any:
+ with ansi_mode_context(self._psdf._internal.spark_frame.sparkSession):
+ return f(self, *args, **kwargs)
+
+ return cast(FuncT, _with_ansi_mode_context)
+
+
# to keep it the same as pandas
NamedAgg = namedtuple("NamedAgg", ["column", "aggfunc"])
@@ -3940,6 +3954,7 @@ def describe(self) -> DataFrame:
# Cast columns to ``"float64"`` to match `pandas.DataFrame.groupby`.
return DataFrame(internal).astype("float64")
+ @with_ansi_mode_context
def corr(
self,
method: str = "pearson",
@@ -4595,7 +4610,6 @@ def _test() -> None:
import numpy
from pyspark.sql import SparkSession
import pyspark.pandas.groupby
- from pyspark.testing.utils import is_ansi_mode_test
os.chdir(os.environ["SPARK_HOME"])
@@ -4603,9 +4617,6 @@ def _test() -> None:
globs["np"] = numpy
globs["ps"] = pyspark.pandas
- if is_ansi_mode_test:
- del pyspark.pandas.groupby.DataFrameGroupBy.corr.__doc__
-
spark = (
SparkSession.builder.master("local[4]")
.appName("pyspark.pandas.groupby tests")
diff --git a/python/pyspark/pandas/indexes/base.py b/python/pyspark/pandas/indexes/base.py
index 2627baac8bc6f..17cb3bf3f74a7 100644
--- a/python/pyspark/pandas/indexes/base.py
+++ b/python/pyspark/pandas/indexes/base.py
@@ -62,6 +62,7 @@
from pyspark.pandas.series import Series, first_series
from pyspark.pandas.spark.accessors import SparkIndexMethods
from pyspark.pandas.utils import (
+ is_ansi_mode_enabled,
is_name_like_tuple,
is_name_like_value,
name_like_string,
@@ -922,13 +923,17 @@ def to_series(self, name: Optional[Name] = None) -> Series:
return result
else:
# MultiIndex
- def struct_to_array(scol: Column) -> Column:
- field_names = result._internal.spark_type_for(
- scol
- ).fieldNames() # type: ignore[attr-defined]
- return F.array([scol[field] for field in field_names])
+ if is_ansi_mode_enabled(self._internal.spark_frame.sparkSession):
+ return result
+ else:
+
+ def struct_to_array(scol: Column) -> Column:
+ field_names = result._internal.spark_type_for(
+ scol
+ ).fieldNames() # type: ignore[attr-defined]
+ return F.array([scol[field] for field in field_names])
- return result.spark.transform(struct_to_array)
+ return result.spark.transform(struct_to_array)
def to_frame(self, index: bool = True, name: Optional[Name] = None) -> DataFrame:
"""
diff --git a/python/pyspark/pandas/internal.py b/python/pyspark/pandas/internal.py
index 3f6831b600678..5739c66f1f421 100644
--- a/python/pyspark/pandas/internal.py
+++ b/python/pyspark/pandas/internal.py
@@ -1200,10 +1200,10 @@ def with_new_sdf(
:param spark_frame: the new Spark DataFrame
:param index_fields: the new InternalFields for the index columns.
- If None, the original dtyeps are used.
+ If None, the original dtypes are used.
:param data_columns: the new column names. If None, the original one is used.
:param data_fields: the new InternalFields for the data columns.
- If None, the original dtyeps are used.
+ If None, the original dtypes are used.
:return: the copied InternalFrame.
"""
if index_fields is None:
diff --git a/python/pyspark/pandas/namespace.py b/python/pyspark/pandas/namespace.py
index 0073c3851065a..a5f2b5ee4f6aa 100644
--- a/python/pyspark/pandas/namespace.py
+++ b/python/pyspark/pandas/namespace.py
@@ -76,6 +76,7 @@
from pyspark.pandas.utils import (
align_diff_frames,
default_session,
+ is_ansi_mode_enabled,
is_name_like_tuple,
is_name_like_value,
name_like_string,
@@ -3630,7 +3631,11 @@ def to_numeric(arg, errors="raise"):
"""
if isinstance(arg, Series):
if errors == "coerce":
- return arg._with_new_scol(arg.spark.column.cast("float"))
+ spark_session = arg._internal.spark_frame.sparkSession
+ if is_ansi_mode_enabled(spark_session):
+ return arg._with_new_scol(arg.spark.column.try_cast("float"))
+ else:
+ return arg._with_new_scol(arg.spark.column.cast("float"))
elif errors == "raise":
scol = arg.spark.column
scol_casted = scol.cast("float")
@@ -3874,7 +3879,6 @@ def _test() -> None:
from pyspark.sql import SparkSession
import pyspark.pandas.namespace
from pandas.util.version import Version
- from pyspark.testing.utils import is_ansi_mode_test
os.chdir(os.environ["SPARK_HOME"])
@@ -3888,10 +3892,6 @@ def _test() -> None:
globs["ps"] = pyspark.pandas
globs["sf"] = F
- if is_ansi_mode_test:
- del pyspark.pandas.namespace.melt.__doc__
- del pyspark.pandas.namespace.to_numeric.__doc__
-
spark = (
SparkSession.builder.master("local[4]")
.appName("pyspark.pandas.namespace tests")
diff --git a/python/pyspark/pandas/series.py b/python/pyspark/pandas/series.py
index f7f8c89ab2783..e5c8890b646c6 100644
--- a/python/pyspark/pandas/series.py
+++ b/python/pyspark/pandas/series.py
@@ -23,7 +23,7 @@
import inspect
import warnings
from collections.abc import Mapping
-from functools import partial, reduce
+from functools import partial, reduce, wraps
from typing import (
Any,
Callable,
@@ -36,6 +36,7 @@
Sequence,
Tuple,
Type,
+ TypeVar,
Union,
cast,
no_type_check,
@@ -103,7 +104,9 @@
from pyspark.pandas.missing.series import MissingPandasLikeSeries
from pyspark.pandas.plot import PandasOnSparkPlotAccessor
from pyspark.pandas.utils import (
+ ansi_mode_context,
combine_frames,
+ is_ansi_mode_enabled,
is_name_like_tuple,
is_name_like_value,
name_like_string,
@@ -142,6 +145,18 @@
# This pattern basically seeks the footer string from pandas'
REPR_PATTERN = re.compile(r"Length: (?P<length>[0-9]+)")
+FuncT = TypeVar("FuncT", bound=Callable[..., Any])
+
+
+def with_ansi_mode_context(f: FuncT) -> FuncT:
+ @wraps(f)
+ def _with_ansi_mode_context(self: "Series", *args: Any, **kwargs: Any) -> Any:
+ with ansi_mode_context(self._internal.spark_frame.sparkSession):
+ return f(self, *args, **kwargs)
+
+ return cast(FuncT, _with_ansi_mode_context)
+
+
_flex_doc_SERIES = """
Return {desc} of series and other, element-wise (binary operator `{op_name}`).
@@ -369,6 +384,10 @@ class Series(Frame, IndexOpsMixin, Generic[T]):
pandas-on-Spark Series that corresponds to pandas Series logically. This holds Spark Column
internally.
+ .. versionchanged:: 4.1.0
+ Support construction from a pandas-on-Spark Series; the additional parameters
+ index, dtype, and name can be used to override the original values.
+
:ivar _internal: an internal immutable Frame to manage metadata.
:type _internal: InternalFrame
:ivar _psdf: Parent's pandas-on-Spark DataFrame
@@ -376,9 +395,10 @@ class Series(Frame, IndexOpsMixin, Generic[T]):
Parameters
----------
- data : array-like, dict, or scalar value, pandas Series
+ data : array-like, dict, or scalar value, pandas Series, pandas-on-Spark Series
Contains data stored in Series
- Note that if `data` is a pandas Series, other arguments should not be used.
+ Note that if `data` is a Series, index, dtype, or name can also be
+ specified to override the original values.
index : array-like or Index (1d)
Values must be hashable and have the same length as `data`.
Non-unique index values are allowed. Will default to
@@ -387,6 +407,8 @@ class Series(Frame, IndexOpsMixin, Generic[T]):
dict.
dtype : numpy.dtype or None
If None, dtype will be inferred
+ name : str, default None
+ The name to give to the Series.
copy : boolean, default False
Copy input data
"""
@@ -406,6 +428,24 @@ def __init__( # type: ignore[no-untyped-def]
self._anchor = data
self._col_label = index
+
+ elif isinstance(data, Series):
+ assert not copy
+ assert not fastpath
+
+ if name:
+ data = data.rename(name)
+
+ if index:
+ data = data.reindex(index)
+
+ if dtype:
+ data = data.astype(dtype)
+
+ anchor = DataFrame(data)
+ self._anchor = anchor
+ self._col_label = anchor._internal.column_labels[0]
+ object.__setattr__(anchor, "_psseries", {self._column_label: self})
else:
if isinstance(data, pd.Series):
assert index is None
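The new constructor branch lets `ps.Series` accept an existing pandas-on-Spark Series and optionally rename, reindex, or re-type it, as described in the updated docstring above. An illustrative usage sketch, assuming this change is in place:

    import pyspark.pandas as ps

    psser = ps.Series([1, 2, 3], name="original")

    # Construct a new Series from an existing pandas-on-Spark Series,
    # overriding its dtype and name per the updated constructor.
    renamed = ps.Series(psser, dtype="float64", name="renamed")
    print(renamed.name, renamed.dtype)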
@@ -2061,7 +2101,7 @@ def fillna(
"""Fill NA/NaN values.
.. note:: the current implementation of 'method' parameter in fillna uses Spark's Window
- without specifying partition specification. This leads to moveing all data into
+ without specifying partition specification. This leads to moving all data into
a single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -3310,7 +3350,7 @@ def autocorr(self, lag: int = 1) -> float:
the Series and its shifted self.
.. note:: the current implementation of autocorr uses Spark's Window without
- specifying partition specification. This leads to moveing all data into
+ specifying partition specification. This leads to moving all data into
a single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -3370,13 +3410,21 @@ def autocorr(self, lag: int = 1) -> float:
else:
lag_scol = F.lag(scol, lag).over(Window.orderBy(NATURAL_ORDER_COLUMN_NAME))
lag_col_name = verify_temp_column_name(sdf, "__autocorr_lag_tmp_col__")
- corr = (
- sdf.withColumn(lag_col_name, lag_scol)
- .select(F.corr(scol, F.col(lag_col_name)))
- .head()[0]
- )
+
+ sdf_lag = sdf.withColumn(lag_col_name, lag_scol)
+ if is_ansi_mode_enabled(sdf.sparkSession):
+ # Compute covariance between the original and lagged columns.
+ # If the covariance is None or zero (indicating no linear relationship),
+ # return NaN; otherwise, proceeding to compute the correlation may raise
+ # DIVIDE_BY_ZERO under ANSI mode.
+ cov_value = sdf_lag.select(F.covar_samp(scol, F.col(lag_col_name))).head()[0]
+ if cov_value is None or cov_value == 0.0:
+ return np.nan
+ corr = sdf_lag.select(F.corr(scol, F.col(lag_col_name))).head()[0]
+
return np.nan if corr is None else corr
+ @with_ansi_mode_context
def corr(
self, other: "Series", method: str = "pearson", min_periods: Optional[int] = None
) -> float:
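The reworked `autocorr` computes the sample covariance between the column and its lagged copy first and short-circuits to NaN when it is NULL or zero, because feeding a zero-variance pair into `corr` can raise DIVIDE_BY_ZERO under ANSI mode. A standalone sketch of that guard on a throwaway DataFrame (column names are illustrative):

    import numpy as np
    from pyspark.sql import SparkSession, functions as F

    spark = (
        SparkSession.builder.master("local[1]")
        .appName("autocorr-guard-sketch")
        .getOrCreate()
    )

    # A constant column: its lagged copy has zero covariance with the original.
    df = spark.createDataFrame([(1.0, 1.0), (1.0, 1.0), (1.0, None)], ["x", "x_lag"])

    # Guard: only call corr() when the covariance is present and non-zero.
    cov_value = df.select(F.covar_samp("x", "x_lag")).head()[0]
    if cov_value is None or cov_value == 0.0:
        result = np.nan
    else:
        result = df.select(F.corr("x", "x_lag")).head()[0]

    print(result)
    spark.stop()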
@@ -4066,7 +4114,7 @@ def rank(
assigned a rank that is the average of the ranks of those values.
.. note:: the current implementation of rank uses Spark's Window without
- specifying partition specification. This leads to moveing all data into
+ specifying partition specification. This leads to moving all data into
a single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -4244,7 +4292,7 @@ def diff(self, periods: int = 1) -> "Series":
DataFrame (default is the element in the same column of the previous row).
.. note:: the current implementation of diff uses Spark's Window without
- specifying partition specification. This leads to moveing all data into
+ specifying partition specification. This leads to moving all data into
a single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -4856,6 +4904,7 @@ def keys(self) -> "ps.Index":
return self.index
# TODO: introduce 'in_place'; fully support 'regex'
+ @with_ansi_mode_context
def replace(
self,
to_replace: Optional[Union[Any, List, Tuple, Dict]] = None,
@@ -5081,33 +5130,68 @@ def replace(
)
)
to_replace = {k: v for k, v in zip(to_replace, value)}
+
+ spark_session = self._internal.spark_frame.sparkSession
+ ansi_mode = is_ansi_mode_enabled(spark_session)
+ col_type = self.spark.data_type
+
if isinstance(to_replace, dict):
is_start = True
if len(to_replace) == 0:
current = self.spark.column
else:
for to_replace_, value in to_replace.items():
- cond = (
- (F.isnan(self.spark.column) | self.spark.column.isNull())
- if pd.isna(to_replace_)
- else (self.spark.column == F.lit(to_replace_))
- )
+ if pd.isna(to_replace_):
+ if ansi_mode and isinstance(col_type, NumericType):
+ cond = F.isnan(self.spark.column) | self.spark.column.isNull()
+ else:
+ cond = self.spark.column.isNull()
+ else:
+ to_replace_lit = (
+ F.lit(to_replace_).try_cast(col_type)
+ if ansi_mode
+ else F.lit(to_replace_)
+ )
+ cond = self.spark.column == to_replace_lit
+ value_expr = F.lit(value).try_cast(col_type) if ansi_mode else F.lit(value)
if is_start:
- current = F.when(cond, value)
+ current = F.when(cond, value_expr)
is_start = False
else:
- current = current.when(cond, value)
+ current = current.when(cond, value_expr)
current = current.otherwise(self.spark.column)
else:
if regex:
# to_replace must be a string
cond = self.spark.column.rlike(cast(str, to_replace))
else:
- cond = self.spark.column.isin(to_replace)
+ if ansi_mode:
+ to_replace_values = (
+ [to_replace]
+ if not is_list_like(to_replace) or isinstance(to_replace, str)
+ else to_replace
+ )
+ to_replace_values = cast(List[Any], to_replace_values)
+ literals = [F.lit(v).try_cast(col_type) for v in to_replace_values]
+ cond = self.spark.column.isin(literals)
+ else:
+ cond = self.spark.column.isin(to_replace)
# to_replace may be a scalar
if np.array(pd.isna(to_replace)).any():
- cond = cond | F.isnan(self.spark.column) | self.spark.column.isNull()
- current = F.when(cond, value).otherwise(self.spark.column)
+ if ansi_mode:
+ if isinstance(col_type, NumericType):
+ cond = cond | F.isnan(self.spark.column) | self.spark.column.isNull()
+ else:
+ cond = cond | self.spark.column.isNull()
+ else:
+ cond = cond | F.isnan(self.spark.column) | self.spark.column.isNull()
+
+ if ansi_mode:
+ value_expr = F.lit(value).try_cast(col_type)
+ current = F.when(cond, value_expr).otherwise(self.spark.column.try_cast(col_type))
+
+ else:
+ current = F.when(cond, value).otherwise(self.spark.column)
return self._with_new_scol(current) # TODO: dtype?
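On the ANSI path, `replace` builds its chained `F.when` expression from literals that are `try_cast` to the column's own type, so type-mismatched replacement values degrade to NULL instead of raising. A simplified standalone sketch of that chained construction over a plain dict (the data, column, and mapping are made up for illustration):

    from pyspark.sql import SparkSession, functions as F
    from pyspark.sql.types import IntegerType

    spark = (
        SparkSession.builder.master("local[1]")
        .appName("replace-when-sketch")
        .getOrCreate()
    )

    df = spark.createDataFrame([(1,), (2,), (3,)], ["value"])
    col_type = IntegerType()
    to_replace = {1: 100, 3: 300}

    # Chain one when() clause per mapping entry, casting literals to the column
    # type with try_cast so incompatible literals become NULL instead of failing.
    current = None
    for old, new in to_replace.items():
        cond = F.col("value") == F.lit(old).try_cast(col_type)
        value_expr = F.lit(new).try_cast(col_type)
        current = F.when(cond, value_expr) if current is None else current.when(cond, value_expr)

    df.select(current.otherwise(F.col("value")).alias("replaced")).show()
    spark.stop()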
@@ -5486,7 +5570,7 @@ def pct_change(self, periods: int = 1) -> "Series":
Percentage change between the current and a prior element.
.. note:: the current implementation of this API uses Spark's Window without
- specifying partition specification. This leads to moveing all data into
+ specifying partition specification. This leads to moving all data into
a single partition in a single machine and could cause serious
performance degradation. Avoid this method with very large datasets.
@@ -7336,16 +7420,12 @@ def _test() -> None:
import sys
from pyspark.sql import SparkSession
import pyspark.pandas.series
- from pyspark.testing.utils import is_ansi_mode_test
os.chdir(os.environ["SPARK_HOME"])
globs = pyspark.pandas.series.__dict__.copy()
globs["ps"] = pyspark.pandas
- if is_ansi_mode_test:
- del pyspark.pandas.series.Series.autocorr.__doc__
-
spark = (
SparkSession.builder.master("local[4]").appName("pyspark.pandas.series tests").getOrCreate()
)
diff --git a/python/pyspark/pandas/strings.py b/python/pyspark/pandas/strings.py
index dc1544d8be39d..05d678d123f47 100644
--- a/python/pyspark/pandas/strings.py
+++ b/python/pyspark/pandas/strings.py
@@ -18,12 +18,14 @@
"""
String functions on pandas-on-Spark Series
"""
+from functools import wraps
from typing import (
Any,
Callable,
Dict,
List,
Optional,
+ TypeVar,
Union,
cast,
no_type_check,
@@ -32,13 +34,25 @@
import numpy as np
import pandas as pd
-from pyspark.pandas.utils import is_ansi_mode_enabled
+from pyspark.pandas.utils import ansi_mode_context, is_ansi_mode_enabled
from pyspark.sql.types import StringType, BinaryType, ArrayType, LongType, MapType
from pyspark.sql import functions as F
from pyspark.sql.functions import pandas_udf
import pyspark.pandas as ps
+FuncT = TypeVar("FuncT", bound=Callable[..., Any])
+
+
+def with_ansi_mode_context(f: FuncT) -> FuncT:
+ @wraps(f)
+ def _with_ansi_mode_context(self: "StringMethods", *args: Any, **kwargs: Any) -> Any:
+ with ansi_mode_context(self._data._internal.spark_frame.sparkSession):
+ return f(self, *args, **kwargs)
+
+ return cast(FuncT, _with_ansi_mode_context)
+
+
class StringMethods:
"""String methods for pandas-on-Spark Series"""
@@ -1890,6 +1904,7 @@ def pandas_slice_replace(s) -> ps.Series[str]: # type: ignore[no-untyped-def]
return self._data.pandas_on_spark.transform_batch(pandas_slice_replace)
+ @with_ansi_mode_context
def split(
self, pat: Optional[str] = None, n: int = -1, expand: bool = False
) -> Union["ps.Series", "ps.DataFrame"]:
@@ -2052,6 +2067,7 @@ def pudf(s: pd.Series) -> pd.Series:
else:
return psser
+ @with_ansi_mode_context
def rsplit(
self, pat: Optional[str] = None, n: int = -1, expand: bool = False
) -> Union["ps.Series", "ps.DataFrame"]:
diff --git a/python/pyspark/pandas/supported_api_gen.py b/python/pyspark/pandas/supported_api_gen.py
index f2a73cb1c1adf..595c11c559d05 100644
--- a/python/pyspark/pandas/supported_api_gen.py
+++ b/python/pyspark/pandas/supported_api_gen.py
@@ -38,7 +38,7 @@
MAX_MISSING_PARAMS_SIZE = 5
COMMON_PARAMETER_SET = {"kwargs", "args", "cls"}
MODULE_GROUP_MATCH = [(pd, ps), (pdw, psw), (pdg, psg)]
-PANDAS_LATEST_VERSION = "2.2.3"
+PANDAS_LATEST_VERSION = "2.3.2"
RST_HEADER = """
=====================
@@ -108,7 +108,9 @@ def _check_pandas_version() -> None:
"""
Check if the installed pandas version matches the expected version.
"""
- if LooseVersion(pd.__version__) != LooseVersion(PANDAS_LATEST_VERSION):
+ # Work around pandas version string issue,
+ # see https://github.com/pandas-dev/pandas/issues/61579.
+ if LooseVersion(pd.__version__.split("+")[0]) != LooseVersion(PANDAS_LATEST_VERSION):
msg = (
f"Warning: pandas {PANDAS_LATEST_VERSION} is required; your version is {pd.__version__}"
)
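The relaxed check strips the PEP 440 local-version segment (anything after "+") before comparing against PANDAS_LATEST_VERSION, so distribution builds that append a local suffix still match. A tiny illustration of the normalization (the version strings are made up):

    expected = "2.3.2"

    for installed in ["2.3.2", "2.3.2+dfsg", "2.3.2+some.local.build"]:
        # Drop the local-version segment (the part after "+") before comparing,
        # mirroring pd.__version__.split("+")[0] in the updated check.
        normalized = installed.split("+")[0]
        print(installed, "->", normalized, "matches expected:", normalized == expected)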
diff --git a/python/pyspark/pandas/tests/computation/test_binary_ops.py b/python/pyspark/pandas/tests/computation/test_binary_ops.py
index 3c9b7293d5d53..1f76064cd6df1 100644
--- a/python/pyspark/pandas/tests/computation/test_binary_ops.py
+++ b/python/pyspark/pandas/tests/computation/test_binary_ops.py
@@ -23,7 +23,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
# This file contains test cases for 'Binary operator functions'
@@ -122,8 +121,7 @@ def test_divide_by_zero_behavior(self):
dtype=np.float32,
)
psdf = ps.from_pandas(pdf)
- # TODO(SPARK-52332): Fix promotion from float32 to float64 during division
- self.assert_eq(psdf["a"] / psdf["b"], (pdf["a"] / pdf["b"]).astype(np.float64))
+ self.assert_eq(psdf["a"] / psdf["b"], pdf["a"] / pdf["b"])
# np.float64
pdf = pd.DataFrame(
@@ -195,6 +193,11 @@ def test_binary_operator_truediv(self):
self.assert_eq(psdf["a"] / psdf["b"], pdf["a"] / pdf["b"])
+ pser = pd.Series([1.1, 2.2, 3.3], dtype=np.float32)
+ psser = ps.from_pandas(pser)
+ self.assert_eq(psser / 1, pser / 1)
+ self.assert_eq(psser / 0, pser / 0)
+
# Negative
psdf = ps.DataFrame({"a": ["x"], "b": [1]})
@@ -208,7 +211,15 @@ def test_binary_operator_truediv(self):
self.assertRaisesRegex(TypeError, ks_err_msg, lambda: 1 / psdf["a"])
def test_binary_operator_floordiv(self):
- psdf = ps.DataFrame({"a": ["x"], "b": [1]})
+ pdf = pd.DataFrame({"a": ["x"], "b": [1], "c": [1.0], "d": [0]})
+ psdf = ps.from_pandas(pdf)
+ self.assert_eq(pdf["b"] // 0, psdf["b"] // 0)
+ self.assert_eq(pdf["c"] // 0, psdf["c"] // 0)
+ self.assert_eq(pdf["d"] // 0, psdf["d"] // 0)
+
+ pser = pd.Series([1.1, 2.2, 3.3], dtype=np.float32)
+ psser = ps.from_pandas(pser)
+ self.assert_eq(psser // 1, pser // 1)
ks_err_msg = "Floor division can not be applied to strings"
self.assertRaisesRegex(TypeError, ks_err_msg, lambda: psdf["a"] // psdf["b"])
@@ -221,10 +232,12 @@ def test_binary_operator_floordiv(self):
def test_binary_operator_mod(self):
# Positive
- pdf = pd.DataFrame({"a": [3], "b": [2]})
+ pdf = pd.DataFrame({"a": [3], "b": [2], "c": [0]})
psdf = ps.from_pandas(pdf)
self.assert_eq(psdf["a"] % psdf["b"], pdf["a"] % pdf["b"])
+ self.assert_eq(psdf["a"] % 0, pdf["a"] % 0)
+ self.assert_eq(1 % psdf["c"], 1 % pdf["c"])
# Negative
psdf = ps.DataFrame({"a": ["x"], "b": [1]})
diff --git a/python/pyspark/pandas/tests/computation/test_corr.py b/python/pyspark/pandas/tests/computation/test_corr.py
index ad982717e9a4c..49cb84ca22e04 100644
--- a/python/pyspark/pandas/tests/computation/test_corr.py
+++ b/python/pyspark/pandas/tests/computation/test_corr.py
@@ -22,11 +22,9 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase, SPARK_CONF_ARROW_ENABLED
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
class FrameCorrMixin:
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_dataframe_corr(self):
pdf = pd.DataFrame(
index=[
diff --git a/python/pyspark/pandas/tests/computation/test_describe.py b/python/pyspark/pandas/tests/computation/test_describe.py
index f88eac7942d17..8df07f1945d24 100644
--- a/python/pyspark/pandas/tests/computation/test_describe.py
+++ b/python/pyspark/pandas/tests/computation/test_describe.py
@@ -26,6 +26,12 @@
class FrameDescribeMixin:
+ @classmethod
+ def setUpClass(cls):
+ super(FrameDescribeMixin, cls).setUpClass()
+ # Some nanosecond->microsecond conversions throw loss of precision errors
+ cls.spark.conf.set("spark.sql.execution.pandas.convertToArrowArraySafely", "false")
+
@property
def pdf(self):
return pd.DataFrame(
diff --git a/python/pyspark/pandas/tests/computation/test_missing_data.py b/python/pyspark/pandas/tests/computation/test_missing_data.py
index dfecaf4be20b0..c777499aea85f 100644
--- a/python/pyspark/pandas/tests/computation/test_missing_data.py
+++ b/python/pyspark/pandas/tests/computation/test_missing_data.py
@@ -23,7 +23,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
# This file contains test cases for 'Missing data handling'
@@ -274,7 +273,6 @@ def test_fillna(self):
pdf.fillna({("x", "a"): -1, ("x", "b"): -2, ("y", "c"): -5}),
)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_replace(self):
pdf = pd.DataFrame(
{
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_as_type.py b/python/pyspark/pandas/tests/data_type_ops/test_as_type.py
index 379d055d585d3..76debd10848a4 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_as_type.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_as_type.py
@@ -32,19 +32,17 @@
class AsTypeTestsMixin:
- """Unit tests for arithmetic operations of numeric data types.
-
- A few test cases are disabled because pandas-on-Spark returns float64 whereas pandas
- returns float32.
- The underlying reason is the respective Spark operations return DoubleType always.
- """
+ """Unit tests for arithmetic operations of numeric data types."""
def test_astype(self):
pdf, psdf = self.pdf, self.psdf
+ int_types = [int, np.int32, np.int16, np.int8]
+ cat_type = CategoricalDtype(categories=[2, 1, 3])
+ other_types = [float, np.float32, bool, str, "category", cat_type]
for col in self.numeric_df_cols:
pser, psser = pdf[col], psdf[col]
- for int_type in [int, np.int32, np.int16, np.int8]:
+ for int_type in int_types:
if not pser.hasnans:
self.assert_eq(pser.astype(int_type), psser.astype(int_type))
else:
@@ -54,14 +52,9 @@ def test_astype(self):
"values to integer" % psser._dtype_op.pretty_name,
lambda: psser.astype(int_type),
)
+ for other_type in other_types:
+ self.assert_eq(pser.astype(other_type), psser.astype(other_type))
- self.assert_eq(pser.astype(bool), psser.astype(bool))
- self.assert_eq(pser.astype(float), psser.astype(float))
- self.assert_eq(pser.astype(np.float32), psser.astype(np.float32))
- self.assert_eq(pser.astype(str), psser.astype(str))
- self.assert_eq(pser.astype("category"), psser.astype("category"))
- cat_type = CategoricalDtype(categories=[2, 1, 3])
- self.assert_eq(pser.astype(cat_type), psser.astype(cat_type))
if extension_object_dtypes_available and extension_float_dtypes_available:
pser = pd.Series(pd.Categorical([1.0, 2.0, 3.0]), dtype=pd.Float64Dtype())
psser = ps.from_pandas(pser)
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_boolean_ops.py b/python/pyspark/pandas/tests/data_type_ops/test_boolean_ops.py
index 6969c527b5f74..ea4b23d537f9a 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_boolean_ops.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_boolean_ops.py
@@ -25,7 +25,6 @@
from pyspark import pandas as ps
from pyspark.pandas import option_context
from pyspark.testing.pandasutils import PandasOnSparkTestCase
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.tests.data_type_ops.testing_utils import OpsTestBase
from pyspark.pandas.typedef.typehints import (
extension_float_dtypes_available,
@@ -100,11 +99,11 @@ def test_mul(self):
else:
self.assertRaises(TypeError, lambda: b_psser * psser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_truediv(self):
pdf, psdf = self.pdf, self.psdf
b_pser, b_psser = pdf["bool"], psdf["bool"]
+ self.assert_eq(b_pser / 0, b_psser / 0)
self.assert_eq(b_pser / 1, b_psser / 1)
self.assert_eq(b_pser / 0.1, b_psser / 0.1)
self.assert_eq(b_pser / b_pser.astype(int), b_psser / b_psser.astype(int))
@@ -116,7 +115,6 @@ def test_truediv(self):
for col in self.non_numeric_df_cols:
self.assertRaises(TypeError, lambda: b_psser / psdf[col])
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_floordiv(self):
pdf, psdf = self.pdf, self.psdf
@@ -124,6 +122,7 @@ def test_floordiv(self):
# float is always returned in pandas-on-Spark
self.assert_eq((b_pser // 1).astype("float"), b_psser // 1)
+ self.assert_eq((b_pser // 0).astype("float"), b_psser // 0)
# in pandas, 1 // 0.1 = 9.0; in pandas-on-Spark, 1 // 0.1 = 10.0
# self.assert_eq(b_pser // 0.1, b_psser // 0.1)
@@ -141,6 +140,7 @@ def test_mod(self):
pdf, psdf = self.pdf, self.psdf
b_pser, b_psser = pdf["bool"], psdf["bool"]
+ self.assert_eq(b_pser % 0, b_psser % 0)
self.assert_eq(b_pser % 1, b_psser % 1)
self.assert_eq(b_pser % 0.1, b_psser % 0.1)
self.assert_eq(b_pser % b_pser.astype(float), b_psser % b_psser.astype(float))
@@ -238,16 +238,13 @@ def test_rpow(self):
def test_rmod(self):
psdf = self.psdf
+ pdf = self.pdf
b_psser = psdf["bool"]
- # 1 % False is 0.0 in pandas
- self.assert_eq(pd.Series([0, 0, None], dtype=float, name="bool"), 1 % b_psser)
- # 0.1 / True is 0.1 in pandas
- self.assert_eq(
- pd.Series([0.10000000000000009, 0.10000000000000009, None], dtype=float, name="bool"),
- 0.1 % b_psser,
- check_exact=False, # [0.1, 0.1, nan] for pandas-on-Spark
- )
+ b_pser = pdf["bool"]
+ self.assert_eq(1 % b_pser.astype(float), 1 % b_psser)
+ # Allow float precision diff: pandas: 0.10000000000000009; pandas-on-Spark: 0.1
+ self.assert_eq(0.1 % b_pser, 0.1 % b_psser, almost=True)
self.assertRaises(TypeError, lambda: datetime.date(1994, 1, 1) % b_psser)
self.assertRaises(TypeError, lambda: True % b_psser)
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_date_ops.py b/python/pyspark/pandas/tests/data_type_ops/test_date_ops.py
index c2b29ee8a1d35..a584497832b25 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_date_ops.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_date_ops.py
@@ -208,31 +208,37 @@ def test_eq(self):
pdf, psdf = self.date_pdf, self.date_psdf
self.assert_eq(pdf["this"] == pdf["that"], psdf["this"] == psdf["that"])
self.assert_eq(pdf["this"] == pdf["this"], psdf["this"] == psdf["this"])
+ self.assertRaises(TypeError, lambda: psdf["this"] == pdf["this"])
def test_ne(self):
pdf, psdf = self.date_pdf, self.date_psdf
self.assert_eq(pdf["this"] != pdf["that"], psdf["this"] != psdf["that"])
self.assert_eq(pdf["this"] != pdf["this"], psdf["this"] != psdf["this"])
+ self.assertRaises(TypeError, lambda: psdf["this"] != pdf["this"])
def test_lt(self):
pdf, psdf = self.date_pdf, self.date_psdf
self.assert_eq(pdf["this"] < pdf["that"], psdf["this"] < psdf["that"])
self.assert_eq(pdf["this"] < pdf["this"], psdf["this"] < psdf["this"])
+ self.assertRaises(TypeError, lambda: psdf["this"] < pdf["this"])
def test_le(self):
pdf, psdf = self.date_pdf, self.date_psdf
self.assert_eq(pdf["this"] <= pdf["that"], psdf["this"] <= psdf["that"])
self.assert_eq(pdf["this"] <= pdf["this"], psdf["this"] <= psdf["this"])
+ self.assertRaises(TypeError, lambda: psdf["this"] <= pdf["this"])
def test_gt(self):
pdf, psdf = self.date_pdf, self.date_psdf
self.assert_eq(pdf["this"] > pdf["that"], psdf["this"] > psdf["that"])
self.assert_eq(pdf["this"] > pdf["this"], psdf["this"] > psdf["this"])
+ self.assertRaises(TypeError, lambda: psdf["this"] > pdf["this"])
def test_ge(self):
pdf, psdf = self.date_pdf, self.date_psdf
self.assert_eq(pdf["this"] >= pdf["that"], psdf["this"] >= psdf["that"])
self.assert_eq(pdf["this"] >= pdf["this"], psdf["this"] >= psdf["this"])
+ self.assertRaises(TypeError, lambda: psdf["this"] >= pdf["this"])
class DateOpsTests(
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_num_arithmetic.py b/python/pyspark/pandas/tests/data_type_ops/test_num_arithmetic.py
index 0201dd6fa1f5f..798a49ae121ed 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_num_arithmetic.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_num_arithmetic.py
@@ -20,8 +20,8 @@
import pandas as pd
from pyspark import pandas as ps
+from pyspark.testing.utils import is_ansi_mode_test
from pyspark.testing.pandasutils import PandasOnSparkTestCase
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.tests.data_type_ops.testing_utils import OpsTestBase
@@ -41,14 +41,12 @@ def float_pser(self):
def float_psser(self):
return ps.from_pandas(self.float_pser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_add(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
pser, psser = pdf[col], psdf[col]
self.assert_eq(pser + pser, psser + psser, check_exact=False)
self.assert_eq(pser + 1, psser + 1, check_exact=False)
- # self.assert_eq(pser + 0.1, psser + 0.1)
self.assert_eq(pser + pser.astype(bool), psser + psser.astype(bool), check_exact=False)
self.assert_eq(pser + True, psser + True, check_exact=False)
self.assert_eq(pser + False, psser + False, check_exact=False)
@@ -59,14 +57,15 @@ def test_add(self):
else:
self.assertRaises(TypeError, lambda: psser + psdf[n_col])
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
+ if is_ansi_mode_test and not col.startswith("decimal"):
+ self.assert_eq(pser + 0.1, psser + 0.1)
+
def test_sub(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
pser, psser = pdf[col], psdf[col]
self.assert_eq(pser - pser, psser - psser, check_exact=False)
self.assert_eq(pser - 1, psser - 1, check_exact=False)
- # self.assert_eq(pser - 0.1, psser - 0.1)
self.assert_eq(pser - pser.astype(bool), psser - psser.astype(bool), check_exact=False)
self.assert_eq(pser - True, psser - True, check_exact=False)
self.assert_eq(pser - False, psser - False, check_exact=False)
@@ -77,6 +76,9 @@ def test_sub(self):
else:
self.assertRaises(TypeError, lambda: psser - psdf[n_col])
+ if is_ansi_mode_test and not col.startswith("decimal"):
+ self.assert_eq(pser - 0.1, psser - 0.1)
+
class ArithmeticTests(
ArithmeticTestsMixin,
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_num_mod.py b/python/pyspark/pandas/tests/data_type_ops/test_num_mod.py
index 5e4b6f46f4333..b1961437a96eb 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_num_mod.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_num_mod.py
@@ -22,7 +22,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.tests.data_type_ops.testing_utils import OpsTestBase
@@ -35,7 +34,6 @@ def float_pser(self):
def float_psser(self):
return ps.from_pandas(self.float_pser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_mod(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
@@ -43,6 +41,9 @@ def test_mod(self):
self.assert_eq(pser % pser, psser % psser, check_exact=False)
self.assert_eq(pser % pser.astype(bool), psser % psser.astype(bool), check_exact=False)
self.assert_eq(pser % True, psser % True, check_exact=False)
+ self.assert_eq(pser % 1, psser % 1, check_exact=False)
+ if not col.startswith("decimal"):
+ self.assert_eq(pser % 0, psser % 0, check_exact=False)
if col in ["int", "int32"]:
self.assert_eq(
pd.Series([np.nan, np.nan, np.nan], dtype=float, name=col), psser % False
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_num_mul_div.py b/python/pyspark/pandas/tests/data_type_ops/test_num_mul_div.py
index 3c58e4655125e..8a719fe9fd88c 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_num_mul_div.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_num_mul_div.py
@@ -22,7 +22,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.tests.data_type_ops.testing_utils import OpsTestBase
@@ -35,7 +34,6 @@ def float_pser(self):
def float_psser(self):
return ps.from_pandas(self.float_pser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_mul(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_num_ops.py b/python/pyspark/pandas/tests/data_type_ops/test_num_ops.py
index 03a794771a910..00fc04e362312 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_num_ops.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_num_ops.py
@@ -23,6 +23,7 @@
from pyspark import pandas as ps
from pyspark.pandas.config import option_context
from pyspark.testing.pandasutils import PandasOnSparkTestCase
+from pyspark.testing.utils import is_ansi_mode_test
from pyspark.pandas.tests.data_type_ops.testing_utils import OpsTestBase
from pyspark.pandas.typedef.typehints import (
extension_dtypes_available,
@@ -128,6 +129,18 @@ def test_invert(self):
else:
self.assertRaises(TypeError, lambda: ~psser)
+ def test_comparison_dtype_compatibility(self):
+ pdf = pd.DataFrame(
+ {"int": [1, 2], "bool": [True, False], "float": [0.1, 0.2], "str": ["1", "2"]}
+ )
+ psdf = ps.from_pandas(pdf)
+ self.assert_eq(pdf["int"] == pdf["bool"], psdf["int"] == psdf["bool"])
+ self.assert_eq(pdf["bool"] == pdf["int"], psdf["bool"] == psdf["int"])
+ self.assert_eq(pdf["int"] == pdf["float"], psdf["int"] == psdf["float"])
+ if is_ansi_mode_test: # TODO: match non-ansi behavior with pandas
+ self.assert_eq(pdf["int"] == pdf["str"], psdf["int"] == psdf["str"])
+ self.assert_eq(pdf["float"] == pdf["bool"], psdf["float"] == psdf["bool"])
+
def test_eq(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_num_reverse.py b/python/pyspark/pandas/tests/data_type_ops/test_num_reverse.py
index 38341bce80308..a14177348cd00 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_num_reverse.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_num_reverse.py
@@ -22,7 +22,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.tests.data_type_ops.testing_utils import OpsTestBase
@@ -42,7 +41,6 @@ def float_pser(self):
def float_psser(self):
return ps.from_pandas(self.float_pser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_radd(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
@@ -55,7 +53,6 @@ def test_radd(self):
self.assertRaises(TypeError, lambda: datetime.date(1994, 1, 1) + psser)
self.assertRaises(TypeError, lambda: datetime.datetime(1994, 1, 1) + psser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_rsub(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
@@ -68,7 +65,6 @@ def test_rsub(self):
self.assertRaises(TypeError, lambda: datetime.date(1994, 1, 1) - psser)
self.assertRaises(TypeError, lambda: datetime.datetime(1994, 1, 1) - psser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_rmul(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
@@ -117,7 +113,6 @@ def test_rpow(self):
self.assertRaises(TypeError, lambda: datetime.date(1994, 1, 1) ** psser)
self.assertRaises(TypeError, lambda: datetime.datetime(1994, 1, 1) ** psser)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_rmod(self):
pdf, psdf = self.pdf, self.psdf
for col in self.numeric_df_cols:
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_string_ops.py b/python/pyspark/pandas/tests/data_type_ops/test_string_ops.py
index 9648ad9ab2c0f..9c3f4cf1dec4b 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_string_ops.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_string_ops.py
@@ -33,19 +33,19 @@
class StringOpsTestsMixin:
@property
- def bool_pdf(self):
+ def str_pdf(self):
return pd.DataFrame({"this": ["x", "y", "z"], "that": ["z", "y", "x"]})
@property
- def bool_non_numeric_pdf(self):
- return pd.concat([self.bool_pdf, self.non_numeric_pdf], axis=1)
+ def str_non_numeric_pdf(self):
+ return pd.concat([self.str_pdf, self.non_numeric_pdf], axis=1)
@property
- def bool_non_numeric_psdf(self):
- return ps.from_pandas(self.bool_non_numeric_pdf)
+ def str_non_numeric_psdf(self):
+ return ps.from_pandas(self.str_non_numeric_pdf)
def test_add(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser + "x", psser + "x")
@@ -188,42 +188,42 @@ def test_invert(self):
self.assertRaises(TypeError, lambda: ~self.psdf["string"])
def test_eq(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser == other_pser, psser == other_psser)
self.assert_eq(pser == pser, psser == psser)
def test_ne(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser != other_pser, psser != other_psser)
self.assert_eq(pser != pser, psser != psser)
def test_lt(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser < other_pser, psser < other_psser)
self.assert_eq(pser < pser, psser < psser)
def test_le(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser <= other_pser, psser <= other_psser)
self.assert_eq(pser <= pser, psser <= psser)
def test_gt(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser > other_pser, psser > other_psser)
self.assert_eq(pser > pser, psser > psser)
def test_ge(self):
- pdf, psdf = self.bool_non_numeric_pdf, self.bool_non_numeric_psdf
+ pdf, psdf = self.str_non_numeric_pdf, self.str_non_numeric_psdf
pser, psser = pdf["this"], psdf["this"]
other_pser, other_psser = pdf["that"], psdf["that"]
self.assert_eq(pser >= other_pser, psser >= other_psser)
diff --git a/python/pyspark/pandas/tests/data_type_ops/test_udt_ops.py b/python/pyspark/pandas/tests/data_type_ops/test_udt_ops.py
index 60b4153198a34..f4f833ea9cf55 100644
--- a/python/pyspark/pandas/tests/data_type_ops/test_udt_ops.py
+++ b/python/pyspark/pandas/tests/data_type_ops/test_udt_ops.py
@@ -130,6 +130,26 @@ def test_from_to_pandas(self):
self.assert_eq(pser, psser._to_pandas())
self.assert_eq(ps.from_pandas(pser), psser)
+ def test_with_first_null(self):
+ lst = [None, None, None, SparseVector(1, {0: 0.1})]
+ pser = pd.Series(lst)
+ psser = ps.Series(lst)
+ self.assert_eq(pser, psser._to_pandas())
+ self.assert_eq(ps.from_pandas(pser), psser)
+
+ lst2 = [SparseVector(1, {0: 0.1}), None, None, None]
+ pdf = pd.DataFrame({"a": lst, "b": lst2})
+ psdf = ps.DataFrame({"a": lst, "b": lst2})
+ self.assert_eq(pdf, psdf._to_pandas())
+ self.assert_eq(ps.from_pandas(pdf), psdf)
+
+ def test_with_all_null(self):
+ lst = [None, None, None, None]
+ pser = pd.Series(lst, dtype=object)
+ psser = ps.Series(lst, dtype=object)
+ self.assert_eq(pser, psser._to_pandas())
+ self.assert_eq(ps.from_pandas(pser), psser)
+
def test_isnull(self):
self.assert_eq(self.pser.isnull(), self.psser.isnull())
diff --git a/python/pyspark/pandas/tests/data_type_ops/testing_utils.py b/python/pyspark/pandas/tests/data_type_ops/testing_utils.py
index 089b929db1b33..17ac2bc5c4747 100644
--- a/python/pyspark/pandas/tests/data_type_ops/testing_utils.py
+++ b/python/pyspark/pandas/tests/data_type_ops/testing_utils.py
@@ -41,6 +41,12 @@
class OpsTestBase:
"""The test base for arithmetic operations of different data types."""
+ @classmethod
+ def setUpClass(cls):
+ super(OpsTestBase, cls).setUpClass()
+ # Some nanosecond->microsecond conversions throw loss of precision errors
+ cls.spark.conf.set("spark.sql.execution.pandas.convertToArrowArraySafely", "false")
+
@property
def numeric_pdf(self):
dtypes = [np.int32, int, np.float32, float]
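This test base, like the describe tests earlier in the patch, now disables `spark.sql.execution.pandas.convertToArrowArraySafely` in `setUpClass` so that lossy conversions such as nanosecond-to-microsecond timestamp truncation do not abort the Arrow path. A minimal sketch of toggling that conf on a session (the session setup itself is illustrative):

    from pyspark.sql import SparkSession

    spark = (
        SparkSession.builder.master("local[1]")
        .appName("arrow-safe-conf-sketch")
        .getOrCreate()
    )

    # When "true", Arrow conversion raises on unsafe casts such as
    # nanosecond -> microsecond truncation; "false" allows the lossy conversion.
    spark.conf.set("spark.sql.execution.pandas.convertToArrowArraySafely", "false")
    print(spark.conf.get("spark.sql.execution.pandas.convertToArrowArraySafely"))

    spark.stop()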
diff --git a/python/pyspark/pandas/tests/diff_frames_ops/test_corrwith.py b/python/pyspark/pandas/tests/diff_frames_ops/test_corrwith.py
index b6474ba9f0ecd..1bd274b45a742 100644
--- a/python/pyspark/pandas/tests/diff_frames_ops/test_corrwith.py
+++ b/python/pyspark/pandas/tests/diff_frames_ops/test_corrwith.py
@@ -20,11 +20,9 @@
import numpy as np
from pyspark import pandas as ps
-from pyspark.loose_version import LooseVersion
from pyspark.pandas.config import set_option, reset_option
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
class DiffFramesCorrWithMixin:
@@ -82,7 +80,6 @@ def tearDownClass(cls):
reset_option("compute.ops_on_diff_frames")
super().tearDownClass()
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_corrwith(self):
df1 = ps.DataFrame({"A": [1, np.nan, 7, 8], "X": [5, 8, np.nan, 3], "C": [10, 4, 9, 3]})
df2 = ps.DataFrame({"A": [5, 3, 6, 4], "B": [11, 2, 4, 3], "C": [4, 3, 8, np.nan]})
@@ -96,11 +93,7 @@ def test_corrwith(self):
# and https://github.com/pandas-dev/pandas/pull/46174 for the initial PR that caused it.
df_bool = ps.DataFrame({"A": [True, True, False, False], "B": [True, False, False, True]})
ser_bool = ps.Series([True, True, False, True])
- if LooseVersion(pd.__version__) == LooseVersion("1.5.0"):
- expected = ps.Series([0.5773502691896257, 0.5773502691896257], index=["B", "A"])
- self.assert_eq(df_bool.corrwith(ser_bool), expected, almost=True)
- else:
- self._test_corrwith(df_bool, ser_bool)
+ self._test_corrwith(df_bool, ser_bool)
self._test_corrwith(self.psdf1, self.psdf1)
self._test_corrwith(self.psdf1, self.psdf2)
@@ -108,15 +101,7 @@ def test_corrwith(self):
self._test_corrwith(self.psdf3, self.psdf4)
self._test_corrwith(self.psdf1, self.psdf1.a)
- # There was a regression in pandas 1.5.0, and fixed in pandas 1.5.1.
- # Therefore, we only test the pandas 1.5.0 in different way.
- # See https://github.com/pandas-dev/pandas/issues/49141 for the reported issue,
- # and https://github.com/pandas-dev/pandas/pull/46174 for the initial PR that causes.
- if LooseVersion(pd.__version__) == LooseVersion("1.5.0"):
- expected = ps.Series([-0.08827348295047496, 0.4413674147523748], index=["b", "a"])
- self.assert_eq(self.psdf1.corrwith(self.psdf2.b), expected, almost=True)
- else:
- self._test_corrwith(self.psdf1, self.psdf2.b)
+ self._test_corrwith(self.psdf1, self.psdf2.b)
self._test_corrwith(self.psdf2, self.psdf3.c)
self._test_corrwith(self.psdf3, self.psdf4.f)
diff --git a/python/pyspark/pandas/tests/diff_frames_ops/test_dot_frame.py b/python/pyspark/pandas/tests/diff_frames_ops/test_dot_frame.py
index 628136d3519db..7a94e1858f09e 100644
--- a/python/pyspark/pandas/tests/diff_frames_ops/test_dot_frame.py
+++ b/python/pyspark/pandas/tests/diff_frames_ops/test_dot_frame.py
@@ -21,7 +21,6 @@
from pyspark.pandas.config import set_option, reset_option
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
class DiffFramesDotFrameMixin:
@@ -35,7 +34,6 @@ def tearDownClass(cls):
reset_option("compute.ops_on_diff_frames")
super().tearDownClass()
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_frame_dot(self):
pdf = pd.DataFrame([[0, 1, -2, -1], [1, 1, 1, 1]])
psdf = ps.from_pandas(pdf)
diff --git a/python/pyspark/pandas/tests/frame/test_constructor.py b/python/pyspark/pandas/tests/frame/test_constructor.py
index 2d4f0f541f107..d0d842d8264c7 100644
--- a/python/pyspark/pandas/tests/frame/test_constructor.py
+++ b/python/pyspark/pandas/tests/frame/test_constructor.py
@@ -30,7 +30,6 @@
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
# This file contains test cases for 'Constructor'
@@ -549,7 +548,6 @@ def test_astype_extension_object_dtypes(self):
@unittest.skipIf(
not extension_float_dtypes_available, "pandas extension float dtypes are not available"
)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_extension_float_dtypes(self):
pdf = pd.DataFrame(
{
diff --git a/python/pyspark/pandas/tests/frame/test_reindexing.py b/python/pyspark/pandas/tests/frame/test_reindexing.py
index ebfaa8910cb7c..0d231a4a6cc71 100644
--- a/python/pyspark/pandas/tests/frame/test_reindexing.py
+++ b/python/pyspark/pandas/tests/frame/test_reindexing.py
@@ -25,7 +25,6 @@
from pyspark.pandas.config import option_context
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
# This file contains test cases for 'Reindexing / Selection / Label manipulation'
@@ -765,7 +764,6 @@ def test_swapaxes(self):
self.assertRaises(AssertionError, lambda: psdf.swapaxes(0, 1, copy=False))
self.assertRaises(ValueError, lambda: psdf.swapaxes(0, -1))
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_isin(self):
pdf = pd.DataFrame(
{
diff --git a/python/pyspark/pandas/tests/groupby/test_corr.py b/python/pyspark/pandas/tests/groupby/test_corr.py
index b44087c828090..39d6d91de4b0a 100644
--- a/python/pyspark/pandas/tests/groupby/test_corr.py
+++ b/python/pyspark/pandas/tests/groupby/test_corr.py
@@ -21,7 +21,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
class CorrMixin:
@@ -48,7 +47,6 @@ def test_corr(self):
almost=True,
)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_method(self):
for m in ["pearson", "spearman", "kendall"]:
self.assert_eq(
diff --git a/python/pyspark/pandas/tests/indexes/test_category.py b/python/pyspark/pandas/tests/indexes/test_category.py
index 761e1100d8afa..acd80378333e8 100644
--- a/python/pyspark/pandas/tests/indexes/test_category.py
+++ b/python/pyspark/pandas/tests/indexes/test_category.py
@@ -21,7 +21,6 @@
from pandas.api.types import CategoricalDtype
import pyspark.pandas as ps
-from pyspark.loose_version import LooseVersion
from pyspark.testing.pandasutils import PandasOnSparkTestCase, TestUtils
@@ -202,18 +201,9 @@ def test_append(self):
psidx3 = ps.from_pandas(pidx3)
self.assert_eq(psidx1.append(psidx2), pidx1.append(pidx2))
- if LooseVersion(pd.__version__) >= LooseVersion("1.5.0"):
- self.assert_eq(
- psidx1.append(psidx3.astype("category")), pidx1.append(pidx3.astype("category"))
- )
- else:
- expected_result = ps.CategoricalIndex(
- ["x", "y", "z", "y", "x", "w", "z"],
- categories=["z", "y", "x", "w"],
- ordered=False,
- dtype="category",
- )
- self.assert_eq(psidx1.append(psidx3.astype("category")), expected_result)
+ self.assert_eq(
+ psidx1.append(psidx3.astype("category")), pidx1.append(pidx3.astype("category"))
+ )
# TODO: append non-categorical or categorical with a different category
self.assertRaises(NotImplementedError, lambda: psidx1.append(psidx3))
diff --git a/python/pyspark/pandas/tests/indexes/test_conversion.py b/python/pyspark/pandas/tests/indexes/test_conversion.py
index 9759a3d06a759..3ccc9697070fc 100644
--- a/python/pyspark/pandas/tests/indexes/test_conversion.py
+++ b/python/pyspark/pandas/tests/indexes/test_conversion.py
@@ -20,9 +20,13 @@
import pandas as pd
from pyspark import pandas as ps
-from pyspark.loose_version import LooseVersion
-from pyspark.testing.pandasutils import PandasOnSparkTestCase, SPARK_CONF_ARROW_ENABLED
+from pyspark.testing.pandasutils import PandasOnSparkTestCase
+from pyspark.pandas.utils import (
+ SPARK_CONF_ARROW_ENABLED,
+ SPARK_CONF_PANDAS_STRUCT_MODE,
+)
from pyspark.testing.sqlutils import SQLTestUtils
+from pyspark.testing.utils import is_ansi_mode_test
class ConversionMixin:
@@ -102,15 +106,10 @@ def test_multi_index_from_index(self):
self.assert_eq(pmidx, psmidx)
# Specify the `names`
- # Specify the `names` while Index creating is no longer supported from pandas 2.0.0.
- if LooseVersion(pd.__version__) >= LooseVersion("2.0.0"):
- pmidx = pd.Index(tuples)
- pmidx.names = ["Hello", "Koalas"]
- psmidx = ps.Index(tuples)
- psmidx.names = ["Hello", "Koalas"]
- else:
- pmidx = pd.Index(tuples, names=["Hello", "Koalas"])
- psmidx = ps.Index(tuples, names=["Hello", "Koalas"])
+ pmidx = pd.Index(tuples)
+ pmidx.names = ["Hello", "Koalas"]
+ psmidx = ps.Index(tuples)
+ psmidx.names = ["Hello", "Koalas"]
self.assertTrue(isinstance(psmidx, ps.MultiIndex))
self.assert_eq(pmidx, psmidx)
@@ -191,10 +190,28 @@ def test_to_series(self):
self.assert_eq((psidx + 1).to_series(), (pidx + 1).to_series())
+ # MultiIndex
+ arrays = [[1, 2], ["red", "blue"]]
+ pidx = pd.MultiIndex.from_arrays(arrays, names=("number", "color"))
+ psidx = ps.from_pandas(pidx)
+
+ if is_ansi_mode_test:
+ with self.sql_conf(
+ {
+ SPARK_CONF_PANDAS_STRUCT_MODE: "row",
+ }
+ ):
+ self.assert_eq(
+ list(psidx.to_series().values),
+ list(pidx.to_series().values),
+ )
+ else:
+ self.assert_eq(list(psidx.to_series().values), [["1", "red"], ["2", "blue"]])
+
pidx = self.pdf.set_index("b", append=True).index
psidx = self.psdf.set_index("b", append=True).index
- with self.sql_conf({SPARK_CONF_ARROW_ENABLED: False}):
+ with self.sql_conf({SPARK_CONF_ARROW_ENABLED: False, SPARK_CONF_PANDAS_STRUCT_MODE: "row"}):
self.assert_eq(psidx.to_series(), pidx.to_series(), check_exact=False)
self.assert_eq(psidx.to_series(name="a"), pidx.to_series(name="a"), check_exact=False)
@@ -243,36 +260,30 @@ def test_to_frame(self):
# non-string names
self.assert_eq(psidx.to_frame(name=[10, 20]), pidx.to_frame(name=[10, 20]))
self.assert_eq(psidx.to_frame(name=("x", 10)), pidx.to_frame(name=("x", 10)))
- if LooseVersion(pd.__version__) < LooseVersion("1.5.0"):
- self.assert_eq(
- psidx.to_frame(name=[("x", 10), ("y", 20)]),
- pidx.to_frame(name=[("x", 10), ("y", 20)]),
- )
- else:
- # Since pandas 1.5.0, the result is changed as below:
- # (x, 10) (y, 20)
- # b
- # 0 4 0 4
- # 1 5 1 5
- # 3 6 3 6
- # 5 3 5 3
- # 6 2 6 2
- # 8 1 8 1
- # 9 0 9 0
- # 0 9 0
- # 0 9 0
- #
- # The columns should be `Index([('x', 20), ('y', 20)], dtype='object')`,
- # but pandas API on Spark doesn't support such a way for creating Index.
- # So, we currently cannot follow the behavior of pandas.
- expected_result = ps.DataFrame(
- {("x", 10): [0, 1, 3, 5, 6, 8, 9, 9, 9], ("y", 20): [4, 5, 6, 3, 2, 1, 0, 0, 0]},
- index=ps.MultiIndex.from_tuples(
- [(0, 4), (1, 5), (3, 6), (5, 3), (6, 2), (8, 1), (9, 0), (9, 0), (9, 0)],
- names=[None, "b"],
- ),
- )
- self.assert_eq(psidx.to_frame(name=[("x", 10), ("y", 20)]), expected_result)
+ # Since pandas 1.5.0, the result is changed as below:
+ # (x, 10) (y, 20)
+ # b
+ # 0 4 0 4
+ # 1 5 1 5
+ # 3 6 3 6
+ # 5 3 5 3
+ # 6 2 6 2
+ # 8 1 8 1
+ # 9 0 9 0
+ # 0 9 0
+ # 0 9 0
+ #
+ # The columns should be `Index([('x', 10), ('y', 20)], dtype='object')`,
+ # but pandas API on Spark doesn't support such a way for creating Index.
+ # So, we currently cannot follow the behavior of pandas.
+ expected_result = ps.DataFrame(
+ {("x", 10): [0, 1, 3, 5, 6, 8, 9, 9, 9], ("y", 20): [4, 5, 6, 3, 2, 1, 0, 0, 0]},
+ index=ps.MultiIndex.from_tuples(
+ [(0, 4), (1, 5), (3, 6), (5, 3), (6, 2), (8, 1), (9, 0), (9, 0), (9, 0)],
+ names=[None, "b"],
+ ),
+ )
+ self.assert_eq(psidx.to_frame(name=[("x", 10), ("y", 20)]), expected_result)
def test_to_list(self):
# Index
diff --git a/python/pyspark/pandas/tests/indexes/test_insert.py b/python/pyspark/pandas/tests/indexes/test_insert.py
index a95c6ee194f54..71fd2f6ad04f6 100644
--- a/python/pyspark/pandas/tests/indexes/test_insert.py
+++ b/python/pyspark/pandas/tests/indexes/test_insert.py
@@ -27,14 +27,8 @@ def test_insert(self):
# Integer
pidx = pd.Index([1, 2, 3], name="Koalas")
psidx = ps.from_pandas(pidx)
- self.assert_eq(
- pidx.insert(1, 100).sort_values(),
- psidx.insert(1, 100).sort_values(),
- )
- self.assert_eq(
- pidx.insert(-1, 100).sort_values(),
- psidx.insert(-1, 100).sort_values(),
- )
+ self.assert_eq(pidx.insert(1, 100), psidx.insert(1, 100))
+ self.assert_eq(pidx.insert(-1, 100), psidx.insert(-1, 100))
err_msg = "index 100 is out of bounds for axis 0 with size 3"
with self.assertRaisesRegex(IndexError, err_msg):
psidx.insert(100, 100)
@@ -45,14 +39,8 @@ def test_insert(self):
# Floating
pidx = pd.Index([1.0, 2.0, 3.0], name="Koalas")
psidx = ps.from_pandas(pidx)
- self.assert_eq(
- pidx.insert(1, 100.0).sort_values(),
- psidx.insert(1, 100.0).sort_values(),
- )
- self.assert_eq(
- pidx.insert(-1, 100.0).sort_values(),
- psidx.insert(-1, 100.0).sort_values(),
- )
+ self.assert_eq(pidx.insert(1, 100.0), psidx.insert(1, 100.0))
+ self.assert_eq(pidx.insert(-1, 100.0), psidx.insert(-1, 100.0))
err_msg = "index 100 is out of bounds for axis 0 with size 3"
with self.assertRaisesRegex(IndexError, err_msg):
psidx.insert(100, 100)
@@ -63,14 +51,8 @@ def test_insert(self):
# String
pidx = pd.Index(["a", "b", "c"], name="Koalas")
psidx = ps.from_pandas(pidx)
- self.assert_eq(
- pidx.insert(1, "x").sort_values(),
- psidx.insert(1, "x").sort_values(),
- )
- self.assert_eq(
- pidx.insert(-1, "x").sort_values(),
- psidx.insert(-1, "x").sort_values(),
- )
+ self.assert_eq(pidx.insert(1, "x"), psidx.insert(1, "x"))
+ self.assert_eq(pidx.insert(-1, "x"), psidx.insert(-1, "x"))
err_msg = "index 100 is out of bounds for axis 0 with size 3"
with self.assertRaisesRegex(IndexError, err_msg):
psidx.insert(100, "x")
@@ -81,14 +63,8 @@ def test_insert(self):
# Boolean
pidx = pd.Index([True, False, True, False], name="Koalas")
psidx = ps.from_pandas(pidx)
- self.assert_eq(
- pidx.insert(1, True).sort_values(),
- psidx.insert(1, True).sort_values(),
- )
- self.assert_eq(
- pidx.insert(-1, True).sort_values(),
- psidx.insert(-1, True).sort_values(),
- )
+ self.assert_eq(pidx.insert(1, True), psidx.insert(1, True))
+ self.assert_eq(pidx.insert(-1, True), psidx.insert(-1, True))
err_msg = "index 100 is out of bounds for axis 0 with size 4"
with self.assertRaisesRegex(IndexError, err_msg):
psidx.insert(100, True)
@@ -101,14 +77,8 @@ def test_insert(self):
[("a", "x"), ("b", "y"), ("c", "z")], names=["Hello", "Koalas"]
)
psmidx = ps.from_pandas(pmidx)
- self.assert_eq(
- pmidx.insert(2, ("h", "j")).sort_values(),
- psmidx.insert(2, ("h", "j")).sort_values(),
- )
- self.assert_eq(
- pmidx.insert(-1, ("h", "j")).sort_values(),
- psmidx.insert(-1, ("h", "j")).sort_values(),
- )
+ self.assert_eq(pmidx.insert(2, ("h", "j")), psmidx.insert(2, ("h", "j")))
+ self.assert_eq(pmidx.insert(-1, ("h", "j")), psmidx.insert(-1, ("h", "j")))
err_msg = "index 4 is out of bounds for axis 0 with size 3"
with self.assertRaisesRegex(IndexError, err_msg):
diff --git a/python/pyspark/pandas/tests/indexes/test_name.py b/python/pyspark/pandas/tests/indexes/test_name.py
index cacf3efcb38b1..d7e3bf1786e8a 100644
--- a/python/pyspark/pandas/tests/indexes/test_name.py
+++ b/python/pyspark/pandas/tests/indexes/test_name.py
@@ -20,7 +20,6 @@
import pandas as pd
from pyspark import pandas as ps
-from pyspark.loose_version import LooseVersion
from pyspark.pandas.exceptions import PandasNotImplementedError
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
@@ -88,12 +87,6 @@ def test_index_names(self):
psidx.name = ["renamed"]
with self.assertRaisesRegex(TypeError, expected_error_message):
psidx.name = ["0", "1"]
- # Specifying `names` when creating Index is no longer supported from pandas 2.0.0.
- if LooseVersion(pd.__version__) >= LooseVersion("2.0.0"):
- pass
- else:
- with self.assertRaisesRegex(TypeError, expected_error_message):
- ps.Index([(1, 2), (3, 4)], names=["a", ["b"]])
def test_multi_index_names(self):
arrays = [[1, 1, 2, 2], ["red", "blue", "red", "blue"]]
diff --git a/python/pyspark/pandas/tests/indexes/test_symmetric_diff.py b/python/pyspark/pandas/tests/indexes/test_symmetric_diff.py
index 2eca8cf4a4312..310fea2035926 100644
--- a/python/pyspark/pandas/tests/indexes/test_symmetric_diff.py
+++ b/python/pyspark/pandas/tests/indexes/test_symmetric_diff.py
@@ -20,7 +20,6 @@
import pandas as pd
import pyspark.pandas as ps
-from pyspark.loose_version import LooseVersion
from pyspark.testing.pandasutils import PandasOnSparkTestCase, TestUtils
@@ -39,17 +38,10 @@ def test_index_symmetric_difference(self):
(psidx1 + 1).symmetric_difference(psidx2).sort_values(),
(pidx1 + 1).symmetric_difference(pidx2).sort_values(),
)
- # No longer supported from pandas 2.0.0.
- if LooseVersion(pd.__version__) >= LooseVersion("2.0.0"):
- self.assert_eq(
- (psidx1 ^ psidx2).sort_values(),
- ps.Index([1, 5], dtype="int64"),
- )
- else:
- self.assert_eq(
- (psidx1 ^ psidx2).sort_values(),
- (pidx1 ^ pidx2).sort_values(),
- )
+ self.assert_eq(
+ (psidx1 ^ psidx2).sort_values(),
+ ps.Index([1, 5], dtype="int64"),
+ )
self.assert_eq(
psidx1.symmetric_difference(psidx2, result_name="result").sort_values(),
pidx1.symmetric_difference(pidx2, result_name="result").sort_values(),
diff --git a/python/pyspark/pandas/tests/io/test_dataframe_spark_io.py b/python/pyspark/pandas/tests/io/test_dataframe_spark_io.py
index af77ea8aa64ff..065a0e8d6ecd5 100644
--- a/python/pyspark/pandas/tests/io/test_dataframe_spark_io.py
+++ b/python/pyspark/pandas/tests/io/test_dataframe_spark_io.py
@@ -21,7 +21,6 @@
import pandas as pd
from pyspark import pandas as ps
-from pyspark.loose_version import LooseVersion
from pyspark.testing.pandasutils import PandasOnSparkTestCase, TestUtils
from pyspark.testing.utils import have_openpyxl, openpyxl_requirement_message
@@ -96,17 +95,9 @@ def test_parquet_read_with_pandas_metadata(self):
self.assert_eq(ps.read_parquet(path2, pandas_metadata=True), expected2)
expected3 = expected2.set_index("index", append=True)
- # There is a bug in `to_parquet` from pandas 1.5.0 when writing MultiIndex.
- # See https://github.com/pandas-dev/pandas/issues/48848 for the reported issue.
- if LooseVersion(pd.__version__) > LooseVersion("1.5.0"):
- expected_psdf = ps.read_parquet(path2, pandas_metadata=True).set_index(
- "index", append=True
- )
- else:
- path3 = "{}/file3.parquet".format(tmp)
- expected3.to_parquet(path3)
- expected_psdf = ps.read_parquet(path3, pandas_metadata=True)
-
+ expected_psdf = ps.read_parquet(path2, pandas_metadata=True).set_index(
+ "index", append=True
+ )
self.assert_eq(expected_psdf, expected3)
def test_parquet_write(self):
diff --git a/python/pyspark/pandas/tests/series/test_as_type.py b/python/pyspark/pandas/tests/series/test_as_type.py
index dfd66ee05d382..da9a399abf7be 100644
--- a/python/pyspark/pandas/tests/series/test_as_type.py
+++ b/python/pyspark/pandas/tests/series/test_as_type.py
@@ -22,6 +22,7 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
+from pyspark.testing.utils import is_ansi_mode_test
from pyspark.pandas.typedef.typehints import (
extension_dtypes_available,
extension_float_dtypes_available,
@@ -31,6 +32,7 @@
class SeriesAsTypeMixin:
def test_astype(self):
+ # numeric
psers = [pd.Series([10, 20, 15, 30, 45], name="x")]
if extension_dtypes_available:
@@ -41,12 +43,14 @@ def test_astype(self):
for pser in psers:
self._test_numeric_astype(pser)
+ # numeric with nulls
pser = pd.Series([10, 20, 15, 30, 45, None, np.nan], name="x")
psser = ps.Series(pser)
self.assert_eq(psser.astype(bool), pser.astype(bool))
self.assert_eq(psser.astype(str), pser.astype(str))
+ # strings
pser = pd.Series(["hi", "hi ", " ", " \t", "", None], name="x")
psser = ps.Series(pser)
@@ -60,12 +64,16 @@ def test_astype(self):
self._check_extension(psser.astype("string"), pser.astype("string"))
self._check_extension(psser.astype(StringDtype()), pser.astype(StringDtype()))
+ # bools
pser = pd.Series([True, False, None], name="x")
psser = ps.Series(pser)
-
self.assert_eq(psser.astype(bool), pser.astype(bool))
self.assert_eq(psser.astype(str), pser.astype(str))
+ if is_ansi_mode_test:
+ with self.assertRaisesRegex(ValueError, "with missing values to integer"):
+ self.assert_eq(psser.astype(int))
+
if extension_object_dtypes_available:
from pandas import BooleanDtype, StringDtype
@@ -74,6 +82,7 @@ def test_astype(self):
self._check_extension(psser.astype("string"), pser.astype("string"))
self._check_extension(psser.astype(StringDtype()), pser.astype(StringDtype()))
+ # datetimes
pser = pd.Series(["2020-10-27 00:00:01", None], name="x")
psser = ps.Series(pser)
diff --git a/python/pyspark/pandas/tests/series/test_series.py b/python/pyspark/pandas/tests/series/test_series.py
index 7409bcc26c29d..26045b5beb947 100644
--- a/python/pyspark/pandas/tests/series/test_series.py
+++ b/python/pyspark/pandas/tests/series/test_series.py
@@ -30,7 +30,6 @@
SPARK_CONF_ARROW_ENABLED,
)
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.exceptions import PandasNotImplementedError
from pyspark.pandas.missing.series import MissingPandasLikeSeries
from pyspark.pandas.typedef.typehints import extension_object_dtypes_available
@@ -103,6 +102,29 @@ def test_empty_series(self):
self.assertTrue(pser_a.empty)
+ def test_series_from_series(self):
+ psser = ps.Series([1, 2, 3, 4, 5, 6, 7], name="x")
+
+ psser_from_psser = ps.Series(psser)
+ self.assert_eq(psser_from_psser, psser)
+
+ psser = ps.Series([1, 2, 3])
+
+ # Specify new index
+ psser_from_psser = ps.Series(psser, index=[1])
+ self.assert_eq(psser_from_psser, ps.Series([2], index=[1]))
+
+ psser_from_psser = ps.Series(psser, index=[1, 2])
+ self.assert_eq(psser_from_psser, ps.Series([2, 3], index=[1, 2]))
+
+ # Specify new out-of-order index
+ psser_from_psser = ps.Series(psser, index=[1, 2, 0])
+ self.assert_eq(psser_from_psser, ps.Series([2, 3, 1], index=[1, 2, 0]))
+
+ # Specify new dtype and name
+ psser_from_psser = ps.Series(psser, name="y", dtype=float)
+ self.assert_eq(psser_from_psser, ps.Series([1, 2, 3], name="y", dtype=float))
+
def test_all_null_series(self):
pser_a = pd.Series([None, None, None], dtype="float64")
pser_b = pd.Series([None, None, None], dtype="str")
@@ -662,7 +684,6 @@ def test_items(self):
self.assert_eq(p_name, k_name)
self.assert_eq(p_items, k_items)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_dot(self):
pdf = pd.DataFrame({"a": [1, 2, 3], "b": [4, 5, 6]})
psdf = ps.from_pandas(pdf)
diff --git a/python/pyspark/pandas/tests/series/test_stat.py b/python/pyspark/pandas/tests/series/test_stat.py
index a779ca558da65..077a8e31d20ad 100644
--- a/python/pyspark/pandas/tests/series/test_stat.py
+++ b/python/pyspark/pandas/tests/series/test_stat.py
@@ -23,7 +23,6 @@
from pyspark import pandas as ps
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
class SeriesStatMixin:
@@ -443,7 +442,6 @@ def test_rdivmod(self):
self.assert_eq(krdiv, prdiv)
self.assert_eq(krmod, prmod)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_mod(self):
pser = pd.Series([100, None, -300, None, 500, -700], name="Koalas")
psser = ps.from_pandas(pser)
@@ -608,6 +606,9 @@ def test_autocorr(self):
with self.assertRaisesRegex(TypeError, r"lag should be an int; however, got"):
psser.autocorr(1.0)
+ psser = ps.Series([1, 0, 0, 0])
+ self.assertTrue(bool(np.isnan(psser.autocorr())))
+
def _test_autocorr(self, pdf):
psdf = ps.from_pandas(pdf)
for lag in range(-10, 10):
diff --git a/python/pyspark/pandas/tests/test_categorical.py b/python/pyspark/pandas/tests/test_categorical.py
index 2730723b27e35..49cbcee47b80c 100644
--- a/python/pyspark/pandas/tests/test_categorical.py
+++ b/python/pyspark/pandas/tests/test_categorical.py
@@ -91,7 +91,6 @@ def test_add_categories(self):
self.assert_eq(pser.cat.add_categories([4, 5]), psser.cat.add_categories([4, 5]))
self.assert_eq(pser.cat.add_categories([]), psser.cat.add_categories([]))
- pser = pser.cat.add_categories(4)
psser = psser.cat.add_categories(4)
self.assertRaises(ValueError, lambda: psser.cat.add_categories(4))
diff --git a/python/pyspark/pandas/tests/test_namespace.py b/python/pyspark/pandas/tests/test_namespace.py
index c86cb17c0e5d0..141c6873d7f59 100644
--- a/python/pyspark/pandas/tests/test_namespace.py
+++ b/python/pyspark/pandas/tests/test_namespace.py
@@ -29,7 +29,6 @@
from pyspark.pandas.missing.general_functions import MissingPandasLikeGeneralFunctions
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
from pyspark.pandas.testing import assert_frame_equal
@@ -561,7 +560,6 @@ def test_read_delta_with_wrong_input(self):
lambda: read_delta("fake_path", version="0", timestamp="2021-06-22"),
)
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_to_numeric(self):
pser = pd.Series(["1", "2", None, "4", "hello"])
psser = ps.from_pandas(pser)
diff --git a/python/pyspark/pandas/tests/test_numpy_compat.py b/python/pyspark/pandas/tests/test_numpy_compat.py
index 39786c6ac2286..f754ee08a7835 100644
--- a/python/pyspark/pandas/tests/test_numpy_compat.py
+++ b/python/pyspark/pandas/tests/test_numpy_compat.py
@@ -23,10 +23,15 @@
from pyspark.pandas import set_option, reset_option
from pyspark.testing.pandasutils import PandasOnSparkTestCase
from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
class NumPyCompatTestsMixin:
+ @classmethod
+ def setUpClass(cls):
+ super(NumPyCompatTestsMixin, cls).setUpClass()
+ # Some nanosecond->microsecond conversions throw loss of precision errors
+ cls.spark.conf.set("spark.sql.execution.pandas.convertToArrowArraySafely", "false")
+
blacklist = [
# Pandas-on-Spark does not currently support
"conj",
@@ -132,7 +137,6 @@ def test_np_spark_compat_series(self):
finally:
reset_option("compute.ops_on_diff_frames")
- @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
def test_np_spark_compat_frame(self):
from pyspark.pandas.numpy_compat import unary_np_spark_mappings, binary_np_spark_mappings
diff --git a/python/pyspark/pandas/tests/test_utils.py b/python/pyspark/pandas/tests/test_utils.py
index 26f571233a8bd..6286df8e54690 100644
--- a/python/pyspark/pandas/tests/test_utils.py
+++ b/python/pyspark/pandas/tests/test_utils.py
@@ -163,6 +163,60 @@ def test_index_error_assert_pandas_equal(self):
},
)
+ def test_dataframe_error_assert_pandas_almost_equal(self):
+ pdf1 = pd.DataFrame({"a": [1, 2, 3], "b": [4, 5, 6]})
+ pdf2 = pd.DataFrame({"a": [1, 3, 3], "b": [4, 5, 6]})
+
+ with self.assertRaises(PySparkAssertionError) as pe:
+ _assert_pandas_almost_equal(pdf1, pdf2, True)
+
+ self.check_error(
+ exception=pe.exception,
+ errorClass="DIFFERENT_PANDAS_DATAFRAME",
+ messageParameters={
+ "left": pdf1.to_string(),
+ "left_dtype": str(pdf1.dtypes),
+ "right": pdf2.to_string(),
+ "right_dtype": str(pdf2.dtypes),
+ },
+ )
+
+ def test_series_error_assert_pandas_equal(self):
+ series1 = pd.Series([1, 2, 3])
+ series2 = pd.Series([4, 5, 6])
+
+ with self.assertRaises(PySparkAssertionError) as pe:
+ _assert_pandas_almost_equal(series1, series2, True)
+
+ self.check_error(
+ exception=pe.exception,
+ errorClass="DIFFERENT_PANDAS_SERIES",
+ messageParameters={
+ "left": series1.to_string(),
+ "left_dtype": str(series1.dtype),
+ "right": series2.to_string(),
+ "right_dtype": str(series2.dtype),
+ },
+ )
+
+ def test_index_error_assert_pandas_almost_equal(self):
+ index1 = pd.Index([1, 2, 3])
+ index2 = pd.Index([4, 5, 6])
+
+ with self.assertRaises(PySparkAssertionError) as pe:
+ _assert_pandas_almost_equal(index1, index2, True)
+
+ self.check_error(
+ exception=pe.exception,
+ errorClass="DIFFERENT_PANDAS_INDEX",
+ messageParameters={
+ "left": index1,
+ "left_dtype": str(index1.dtype),
+ "right": index2,
+ "right_dtype": str(index2.dtype),
+ },
+ )
+
def test_multiindex_error_assert_pandas_almost_equal(self):
pdf1 = pd.DataFrame({"a": [1, 2], "b": [4, 10]}, index=[0, 1])
pdf2 = pd.DataFrame({"a": [1, 5, 3], "b": [1, 5, 6]}, index=[0, 1, 3])
diff --git a/python/pyspark/pandas/typedef/typehints.py b/python/pyspark/pandas/typedef/typehints.py
index 4244f5831aa50..48545d124b2d8 100644
--- a/python/pyspark/pandas/typedef/typehints.py
+++ b/python/pyspark/pandas/typedef/typehints.py
@@ -362,8 +362,9 @@ def infer_pd_series_spark_type(
if dtype == np.dtype("object"):
if len(pser) == 0 or pser.isnull().all():
return types.NullType()
- elif hasattr(pser.iloc[0], "__UDT__"):
- return pser.iloc[0].__UDT__
+ notnull = pser[pser.notnull()]
+ if hasattr(notnull.iloc[0], "__UDT__"):
+ return notnull.iloc[0].__UDT__
else:
return from_arrow_type(pa.Array.from_pandas(pser).type, prefer_timestamp_ntz)
elif isinstance(dtype, CategoricalDtype):
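A note on the `infer_pd_series_spark_type` change above: the UDT lookup now inspects the first non-null value instead of `pser.iloc[0]`, so object columns whose leading rows are null still resolve to the value's `__UDT__`. A minimal plain-pandas sketch of the difference; `FakeUDTValue` is a hypothetical stand-in for an object carrying a `__UDT__` attribute, as real UDT instances do:

```python
# Minimal sketch with plain pandas; FakeUDTValue is a hypothetical stand-in.
import pandas as pd


class FakeUDTValue:
    __UDT__ = "example-udt"


pser = pd.Series([None, FakeUDTValue(), FakeUDTValue()])

# Previous lookup: checks the first element, which is None here.
print(hasattr(pser.iloc[0], "__UDT__"))  # False

# New lookup: checks the first non-null element instead.
notnull = pser[pser.notnull()]
print(hasattr(notnull.iloc[0], "__UDT__"))  # True
```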
diff --git a/python/pyspark/pandas/utils.py b/python/pyspark/pandas/utils.py
index 23350c06a147e..6a0561fad9c5a 100644
--- a/python/pyspark/pandas/utils.py
+++ b/python/pyspark/pandas/utils.py
@@ -20,7 +20,9 @@
import functools
from contextlib import contextmanager
+import json
import os
+import threading
from typing import (
Any,
Callable,
@@ -69,6 +71,7 @@
SPARK_CONF_ARROW_ENABLED = "spark.sql.execution.arrow.pyspark.enabled"
+SPARK_CONF_PANDAS_STRUCT_MODE = "spark.sql.execution.pandas.structHandlingMode"
class PandasAPIOnSparkAdviceWarning(Warning):
@@ -1070,11 +1073,101 @@ def xor(df1: PySparkDataFrame, df2: PySparkDataFrame) -> PySparkDataFrame:
)
+_ansi_mode_enabled = threading.local()
+
+
+def _is_in_ansi_mode_context(spark: SparkSession) -> bool:
+ if is_remote():
+ from pyspark.sql.connect.session import SparkSession as ConnectSession
+
+ session_id = cast(ConnectSession, spark).session_id
+ return hasattr(_ansi_mode_enabled, session_id)
+ else:
+ return hasattr(_ansi_mode_enabled, "enabled")
+
+
+def _set_ansi_mode_enabled_in_context(spark: SparkSession, enabled: Optional[bool] = None) -> None:
+ if enabled is not None:
+ assert _is_in_ansi_mode_context(spark)
+
+ if is_remote():
+ from pyspark.sql.connect.session import SparkSession as ConnectSession
+
+ session_id = cast(ConnectSession, spark).session_id
+ setattr(_ansi_mode_enabled, session_id, enabled)
+ else:
+ _ansi_mode_enabled.enabled = enabled
+
+
+def _get_ansi_mode_enabled_in_context(spark: SparkSession) -> Optional[bool]:
+ assert _is_in_ansi_mode_context(spark)
+
+ if is_remote():
+ from pyspark.sql.connect.session import SparkSession as ConnectSession
+
+ session_id = cast(ConnectSession, spark).session_id
+ return getattr(_ansi_mode_enabled, session_id)
+ else:
+ return _ansi_mode_enabled.enabled
+
+
+def _unset_ansi_mode_enabled_in_context(spark: SparkSession) -> None:
+ assert _is_in_ansi_mode_context(spark)
+
+ if is_remote():
+ from pyspark.sql.connect.session import SparkSession as ConnectSession
+
+ session_id = cast(ConnectSession, spark).session_id
+ delattr(_ansi_mode_enabled, session_id)
+ else:
+ del _ansi_mode_enabled.enabled
+
+
+@contextmanager
+def ansi_mode_context(spark: SparkSession) -> Iterator[None]:
+ if _is_in_ansi_mode_context(spark):
+ yield
+ else:
+ _set_ansi_mode_enabled_in_context(spark)
+ try:
+ yield
+ finally:
+ _unset_ansi_mode_enabled_in_context(spark)
+
+
def is_ansi_mode_enabled(spark: SparkSession) -> bool:
- return (
- ps.get_option("compute.ansi_mode_support", spark_session=spark)
- and spark.conf.get("spark.sql.ansi.enabled") == "true"
- )
+ def _is_ansi_mode_enabled() -> bool:
+ if is_remote():
+ from pyspark.sql.connect.session import SparkSession as ConnectSession
+ from pyspark.pandas.config import _key_format, _options_dict
+
+ client = cast(ConnectSession, spark).client
+ (ansi_mode_support, ansi_enabled) = client.get_config_with_defaults(
+ (
+ _key_format("compute.ansi_mode_support"),
+ json.dumps(_options_dict["compute.ansi_mode_support"].default),
+ ),
+ ("spark.sql.ansi.enabled", None),
+ )
+ if ansi_enabled is None:
+ ansi_enabled = spark.conf.get("spark.sql.ansi.enabled")
+ # Explicitly set the fetched value so the next lookup avoids another round trip.
+ spark.conf.set("spark.sql.ansi.enabled", ansi_enabled)
+ return json.loads(ansi_mode_support) and ansi_enabled.lower() == "true"
+ else:
+ return (
+ ps.get_option("compute.ansi_mode_support", spark_session=spark)
+ and spark.conf.get("spark.sql.ansi.enabled").lower() == "true"
+ )
+
+ if _is_in_ansi_mode_context(spark):
+ enabled = _get_ansi_mode_enabled_in_context(spark)
+ if enabled is None:
+ enabled = _is_ansi_mode_enabled()
+ _set_ansi_mode_enabled_in_context(spark, enabled)
+ return enabled
+ else:
+ return _is_ansi_mode_enabled()
def _test() -> None:
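The `ansi_mode_context` helper and the reworked `is_ansi_mode_enabled` above cache the resolved ANSI flag in a thread-local slot (keyed by the Connect session id when remote), so a single pandas-on-Spark operation does not repeatedly query `spark.sql.ansi.enabled`. A simplified, Spark-free sketch of that caching pattern follows; all names below are illustrative, not part of the actual API:

```python
# Simplified sketch of the thread-local, context-scoped caching pattern.
import threading
from contextlib import contextmanager
from typing import Iterator

_cache = threading.local()


def _expensive_lookup() -> bool:
    print("querying config...")  # imagine a round trip to the Spark conf here
    return True


@contextmanager
def cached_flag_context() -> Iterator[None]:
    if hasattr(_cache, "value"):  # already inside a context: reuse the slot
        yield
    else:
        _cache.value = None  # open an empty slot
        try:
            yield
        finally:
            del _cache.value  # drop the cache on exit


def flag_enabled() -> bool:
    if hasattr(_cache, "value"):
        if _cache.value is None:
            _cache.value = _expensive_lookup()  # fill lazily, once per context
        return _cache.value
    return _expensive_lookup()  # outside any context: no caching


with cached_flag_context():
    flag_enabled()  # prints "querying config..." once
    flag_enabled()  # served from the thread-local cache
```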
diff --git a/python/pyspark/pipelines/api.py b/python/pyspark/pipelines/api.py
index 57de64e970351..35beff19c981d 100644
--- a/python/pyspark/pipelines/api.py
+++ b/python/pyspark/pipelines/api.py
@@ -35,21 +35,16 @@ def append_flow(
*,
target: str,
name: Optional[str] = None,
- comment: Optional[str] = None,
spark_conf: Optional[Dict[str, str]] = None,
- once: bool = False,
) -> Callable[[QueryFunction], None]:
"""
Return a decorator on a query function to define a flow in a pipeline.
:param name: The name of the flow. If unspecified, the query function's name will be used.
:param target: The name of the dataset this flow writes to. Must be specified.
- :param comment: Description of the flow. If unspecified, the dataset's comment will be used.
:param spark_conf: A dict whose keys are the conf names and values are the conf values. \
These confs will be set when the flow is executed; they can override confs set for the \
destination, for the pipeline, or on the cluster.
- :param once: If True, indicates this flow should run only once. (It will be rerun upon a full \
- refresh operation.)
"""
if name is not None and type(name) is not str:
raise PySparkTypeError(
@@ -69,7 +64,6 @@ def outer(func: QueryFunction) -> None:
target=target,
spark_conf=spark_conf,
source_code_location=source_code_location,
- once=once,
func=func,
)
get_active_graph_element_registry().register_flow(flow)
@@ -179,7 +173,6 @@ def outer(
target=resolved_name,
spark_conf=spark_conf or {},
source_code_location=source_code_location,
- once=False,
func=decorated,
)
)
@@ -282,7 +275,6 @@ def outer(
target=resolved_name,
spark_conf=spark_conf or {},
source_code_location=source_code_location,
- once=False,
func=decorated,
)
)
@@ -373,7 +365,6 @@ def outer(decorated: QueryFunction) -> None:
spark_conf=spark_conf or {},
name=resolved_name,
source_code_location=source_code_location,
- once=False,
)
)
@@ -409,7 +400,6 @@ def create_streaming_table(
name: str,
*,
comment: Optional[str] = None,
- spark_conf: Optional[Dict[str, str]] = None,
table_properties: Optional[Dict[str, str]] = None,
partition_cols: Optional[List[str]] = None,
schema: Optional[Union[StructType, str]] = None,
@@ -423,9 +413,6 @@ def create_streaming_table(
:param name: The name of the table.
:param comment: Description of the table.
- :param spark_conf: A dict whose keys are the conf names and values are the conf values. \
- These confs will be set when the query for the dataset is executed and they can override \
- confs set for the pipeline or on the cluster.
:param table_properties: A dict where the keys are the property names and the values are the \
property values. These properties will be set on the table.
:param partition_cols: A list containing the column names of the partition columns.
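For context, a short sketch of how the slimmed-down `append_flow` signature (no `comment` or `once`) is used together with `create_streaming_table` inside a pipeline definition file. The dataset and table names are illustrative, and registration only succeeds when the file is executed inside a graph element registration context (e.g. by the pipelines CLI):

```python
# Illustrative pipeline definition file; "events" and "raw_events" are made up.
from pyspark import pipelines as dp
from pyspark.sql import DataFrame, SparkSession

spark = SparkSession.active()

dp.create_streaming_table("events")


@dp.append_flow(target="events", name="ingest_events")
def ingest_events() -> DataFrame:
    # Streaming source feeding the streaming table declared above.
    return spark.readStream.table("raw_events")
```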
diff --git a/python/pyspark/pipelines/block_session_mutations.py b/python/pyspark/pipelines/block_session_mutations.py
new file mode 100644
index 0000000000000..df63d2023a4ba
--- /dev/null
+++ b/python/pyspark/pipelines/block_session_mutations.py
@@ -0,0 +1,135 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+from contextlib import contextmanager
+from typing import Generator, NoReturn, List, Callable
+
+from pyspark.errors import PySparkException
+from pyspark.sql.connect.catalog import Catalog
+from pyspark.sql.connect.conf import RuntimeConf
+from pyspark.sql.connect.dataframe import DataFrame
+from pyspark.sql.connect.udf import UDFRegistration
+
+# PySpark methods that should be blocked from executing in Python pipeline definition files.
+ERROR_CLASS = "SESSION_MUTATION_IN_DECLARATIVE_PIPELINE"
+BLOCKED_METHODS: List = [
+ {
+ "class": RuntimeConf,
+ "method": "set",
+ "error_sub_class": "SET_RUNTIME_CONF",
+ },
+ {
+ "class": Catalog,
+ "method": "setCurrentCatalog",
+ "error_sub_class": "SET_CURRENT_CATALOG",
+ },
+ {
+ "class": Catalog,
+ "method": "setCurrentDatabase",
+ "error_sub_class": "SET_CURRENT_DATABASE",
+ },
+ {
+ "class": Catalog,
+ "method": "dropTempView",
+ "error_sub_class": "DROP_TEMP_VIEW",
+ },
+ {
+ "class": Catalog,
+ "method": "dropGlobalTempView",
+ "error_sub_class": "DROP_GLOBAL_TEMP_VIEW",
+ },
+ {
+ "class": DataFrame,
+ "method": "createTempView",
+ "error_sub_class": "CREATE_TEMP_VIEW",
+ },
+ {
+ "class": DataFrame,
+ "method": "createOrReplaceTempView",
+ "error_sub_class": "CREATE_OR_REPLACE_TEMP_VIEW",
+ },
+ {
+ "class": DataFrame,
+ "method": "createGlobalTempView",
+ "error_sub_class": "CREATE_GLOBAL_TEMP_VIEW",
+ },
+ {
+ "class": DataFrame,
+ "method": "createOrReplaceGlobalTempView",
+ "error_sub_class": "CREATE_OR_REPLACE_GLOBAL_TEMP_VIEW",
+ },
+ {
+ "class": UDFRegistration,
+ "method": "register",
+ "error_sub_class": "REGISTER_UDF",
+ },
+ {
+ "class": UDFRegistration,
+ "method": "registerJavaFunction",
+ "error_sub_class": "REGISTER_JAVA_UDF",
+ },
+ {
+ "class": UDFRegistration,
+ "method": "registerJavaUDAF",
+ "error_sub_class": "REGISTER_JAVA_UDAF",
+ },
+]
+
+
+def _create_blocked_method(error_method_name: str, error_sub_class: str) -> Callable:
+ def blocked_method(*args: object, **kwargs: object) -> NoReturn:
+ raise PySparkException(
+ errorClass=f"{ERROR_CLASS}.{error_sub_class}",
+ messageParameters={
+ "method": error_method_name,
+ },
+ )
+
+ return blocked_method
+
+
+@contextmanager
+def block_session_mutations() -> Generator[None, None, None]:
+ """
+ Context manager that blocks session-mutating methods while a pipeline Python definition
+ file is executed. See BLOCKED_METHODS above for the full list of blocked methods.
+ """
+ # Store original methods
+ original_methods = {}
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ original_methods[(cls, method_name)] = getattr(cls, method_name)
+
+ try:
+ # Replace methods with blocked versions
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ error_method_name = f"'{cls.__name__}.{method_name}'"
+ blocked_method = _create_blocked_method(
+ error_method_name, method_info["error_sub_class"]
+ )
+ setattr(cls, method_name, blocked_method)
+
+ yield
+ finally:
+ # Restore original methods
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ original_method = original_methods[(cls, method_name)]
+ setattr(cls, method_name, original_method)
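A usage sketch of the new context manager, assuming a reachable Spark Connect endpoint; the remote URL and config key below are illustrative. Inside the `with` block the patched methods raise a `PySparkException` whose condition is `SESSION_MUTATION_IN_DECLARATIVE_PIPELINE.<SUB_CLASS>`, and the originals are restored on exit:

```python
from pyspark.errors import PySparkException
from pyspark.pipelines.block_session_mutations import block_session_mutations
from pyspark.sql import SparkSession

# Assumes a Spark Connect server is reachable at this (illustrative) URL.
spark = SparkSession.builder.remote("sc://localhost").getOrCreate()

with block_session_mutations():
    try:
        spark.conf.set("spark.some.key", "value")  # RuntimeConf.set is patched here
    except PySparkException as e:
        print(e.getCondition())  # SESSION_MUTATION_IN_DECLARATIVE_PIPELINE.SET_RUNTIME_CONF

spark.conf.set("spark.some.key", "value")  # original method restored after the block
```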
diff --git a/python/pyspark/pipelines/cli.py b/python/pyspark/pipelines/cli.py
index 824c2a5fff166..43f9ae150f3f3 100644
--- a/python/pyspark/pipelines/cli.py
+++ b/python/pyspark/pipelines/cli.py
@@ -28,10 +28,11 @@
import yaml
from dataclasses import dataclass
from pathlib import Path
-from typing import Any, Generator, Mapping, Optional, Sequence
+from typing import Any, Generator, List, Mapping, Optional, Sequence
from pyspark.errors import PySparkException, PySparkTypeError
from pyspark.sql import SparkSession
+from pyspark.pipelines.block_session_mutations import block_session_mutations
from pyspark.pipelines.graph_element_registry import (
graph_element_registration_context,
GraphElementRegistry,
@@ -61,12 +62,14 @@ class DefinitionsGlob:
class PipelineSpec:
"""Spec for a pipeline.
+ :param name: The name of the pipeline.
:param catalog: The default catalog to use for the pipeline.
:param database: The default database to use for the pipeline.
:param configuration: A dictionary of Spark configuration properties to set for the pipeline.
:param definitions: A list of glob patterns for finding pipeline definitions files.
"""
+ name: str
catalog: Optional[str]
database: Optional[str]
configuration: Mapping[str, str]
@@ -110,13 +113,23 @@ def load_pipeline_spec(spec_path: Path) -> PipelineSpec:
def unpack_pipeline_spec(spec_data: Mapping[str, Any]) -> PipelineSpec:
+ ALLOWED_FIELDS = {"name", "catalog", "database", "schema", "configuration", "definitions"}
+ REQUIRED_FIELDS = ["name"]
for key in spec_data.keys():
- if key not in ["catalog", "database", "schema", "configuration", "definitions"]:
+ if key not in ALLOWED_FIELDS:
raise PySparkException(
errorClass="PIPELINE_SPEC_UNEXPECTED_FIELD", messageParameters={"field_name": key}
)
+ for key in REQUIRED_FIELDS:
+ if key not in spec_data:
+ raise PySparkException(
+ errorClass="PIPELINE_SPEC_MISSING_REQUIRED_FIELD",
+ messageParameters={"field_name": key},
+ )
+
return PipelineSpec(
+ name=spec_data["name"],
catalog=spec_data.get("catalog"),
database=spec_data.get("database", spec_data.get("schema")),
configuration=validate_str_dict(spec_data.get("configuration", {}), "configuration"),
@@ -180,7 +193,8 @@ def register_definitions(
assert (
module_spec.loader is not None
), f"Module spec has no loader for {file}"
- module_spec.loader.exec_module(module)
+ with block_session_mutations():
+ module_spec.loader.exec_module(module)
elif file.suffix == ".sql":
log_with_curr_timestamp(f"Registering SQL file {file}...")
with file.open("r") as f:
@@ -205,17 +219,46 @@ def change_dir(path: Path) -> Generator[None, None, None]:
os.chdir(prev)
-def run(spec_path: Path, remote: str) -> None:
- """Run the pipeline defined with the given spec."""
+def run(
+ spec_path: Path,
+ full_refresh: Sequence[str],
+ full_refresh_all: bool,
+ refresh: Sequence[str],
+ dry: bool,
+) -> None:
+ """Run the pipeline defined with the given spec.
+
+ :param spec_path: Path to the pipeline specification file.
+ :param full_refresh: List of datasets to reset and recompute.
+ :param full_refresh_all: Perform a full graph reset and recompute.
+ :param refresh: List of datasets to update.
+ :param dry: If True, the run only validates the graph and checks for errors, without executing it.
+ """
+ # Validate conflicting arguments
+ if full_refresh_all:
+ if full_refresh:
+ raise PySparkException(
+ errorClass="CONFLICTING_PIPELINE_REFRESH_OPTIONS",
+ messageParameters={
+ "conflicting_option": "--full_refresh",
+ },
+ )
+ if refresh:
+ raise PySparkException(
+ errorClass="CONFLICTING_PIPELINE_REFRESH_OPTIONS",
+ messageParameters={
+ "conflicting_option": "--refresh",
+ },
+ )
+
log_with_curr_timestamp(f"Loading pipeline spec from {spec_path}...")
spec = load_pipeline_spec(spec_path)
log_with_curr_timestamp("Creating Spark session...")
- spark_builder = SparkSession.builder.remote(remote)
+ spark_builder = SparkSession.builder
for key, value in spec.configuration.items():
spark_builder = spark_builder.config(key, value)
- spark = spark_builder.create()
+ spark = spark_builder.getOrCreate()
log_with_curr_timestamp("Creating dataflow graph...")
dataflow_graph_id = create_dataflow_graph(
@@ -230,23 +273,60 @@ def run(spec_path: Path, remote: str) -> None:
register_definitions(spec_path, registry, spec)
log_with_curr_timestamp("Starting run...")
- result_iter = start_run(spark, dataflow_graph_id)
+ result_iter = start_run(
+ spark,
+ dataflow_graph_id,
+ full_refresh=full_refresh,
+ full_refresh_all=full_refresh_all,
+ refresh=refresh,
+ dry=dry,
+ )
try:
handle_pipeline_events(result_iter)
finally:
spark.stop()
+def parse_table_list(value: str) -> List[str]:
+ """Parse a comma-separated list of table names, handling whitespace."""
+ return [table.strip() for table in value.split(",") if table.strip()]
+
+
if __name__ == "__main__":
parser = argparse.ArgumentParser(description="Pipeline CLI")
subparsers = parser.add_subparsers(dest="command", required=True)
# "run" subcommand
- run_parser = subparsers.add_parser("run", help="Run a pipeline.")
+ run_parser = subparsers.add_parser(
+ "run",
+ help="Run a pipeline. If no refresh options are specified, "
+ "a default incremental update is performed.",
+ )
run_parser.add_argument("--spec", help="Path to the pipeline spec.")
run_parser.add_argument(
- "--remote", help="The Spark Connect remote to connect to.", required=True
+ "--full-refresh",
+ type=parse_table_list,
+ action="extend",
+ help="List of datasets to reset and recompute (comma-separated).",
+ default=[],
+ )
+ run_parser.add_argument(
+ "--full-refresh-all", action="store_true", help="Perform a full graph reset and recompute."
)
+ run_parser.add_argument(
+ "--refresh",
+ type=parse_table_list,
+ action="extend",
+ help="List of datasets to update (comma-separated).",
+ default=[],
+ )
+
+ # "dry-run" subcommand
+ dry_run_parser = subparsers.add_parser(
+ "dry-run",
+ help="Launch a run that just validates the graph and checks for errors.",
+ )
+ dry_run_parser.add_argument("--spec", help="Path to the pipeline spec.")
# "init" subcommand
init_parser = subparsers.add_parser(
@@ -261,9 +341,9 @@ def run(spec_path: Path, remote: str) -> None:
)
args = parser.parse_args()
- assert args.command in ["run", "init"]
+ assert args.command in ["run", "dry-run", "init"]
- if args.command == "run":
+ if args.command in ["run", "dry-run"]:
if args.spec is not None:
spec_path = Path(args.spec)
if not spec_path.is_file():
@@ -274,6 +354,22 @@ def run(spec_path: Path, remote: str) -> None:
else:
spec_path = find_pipeline_spec(Path.cwd())
- run(spec_path=spec_path, remote=args.remote)
+ if args.command == "run":
+ run(
+ spec_path=spec_path,
+ full_refresh=args.full_refresh,
+ full_refresh_all=args.full_refresh_all,
+ refresh=args.refresh,
+ dry=args.command == "dry-run",
+ )
+ else:
+ assert args.command == "dry-run"
+ run(
+ spec_path=spec_path,
+ full_refresh=[],
+ full_refresh_all=False,
+ refresh=[],
+ dry=True,
+ )
elif args.command == "init":
init(args.name)
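A self-contained sketch of how the new refresh flags parse: `type=parse_table_list` splits each comma-separated value, and `action="extend"` merges repeated occurrences into one flat list. The parser below is a local stand-in for the real CLI wiring above:

```python
import argparse


def parse_table_list(value):
    """Split a comma-separated list of table names, trimming whitespace."""
    return [table.strip() for table in value.split(",") if table.strip()]


parser = argparse.ArgumentParser()
parser.add_argument("--full-refresh", type=parse_table_list, action="extend", default=[])
parser.add_argument("--full-refresh-all", action="store_true")
parser.add_argument("--refresh", type=parse_table_list, action="extend", default=[])

args = parser.parse_args(["--full-refresh", "tbl1, tbl2", "--full-refresh", "tbl3"])
print(args.full_refresh)      # ['tbl1', 'tbl2', 'tbl3'] -- repeated flags extend one list
print(args.full_refresh_all)  # False
```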
diff --git a/python/pyspark/pipelines/dataset.py b/python/pyspark/pipelines/dataset.py
index 1355794f25be7..b46bc9f6e2b6b 100644
--- a/python/pyspark/pipelines/dataset.py
+++ b/python/pyspark/pipelines/dataset.py
@@ -64,7 +64,7 @@ class MaterializedView(Table):
@dataclass(frozen=True)
class StreamingTable(Table):
- """Definition of a materialized view in a pipeline dataflow graph. A streaming table is a
+ """Definition of a streaming table in a pipeline dataflow graph. A streaming table is a
table whose contents are produced by one or more streaming flows."""
diff --git a/python/pyspark/pipelines/flow.py b/python/pyspark/pipelines/flow.py
index c2f8599ebf9f5..7c499c0b36221 100644
--- a/python/pyspark/pipelines/flow.py
+++ b/python/pyspark/pipelines/flow.py
@@ -33,7 +33,6 @@ class Flow:
:param spark_conf: A dict where the keys are the Spark configuration property names and the
values are the property values. These properties will be set on the flow.
:param source_code_location: The location of the source code that created this flow.
- :param once: If True, the flow will be executed once per run.
:param func: The function that defines the flow. This function should return a DataFrame.
"""
@@ -41,5 +40,4 @@ class Flow:
target: str
spark_conf: Dict[str, str]
source_code_location: SourceCodeLocation
- once: bool
func: QueryFunction
diff --git a/python/pyspark/pipelines/init_cli.py b/python/pyspark/pipelines/init_cli.py
index 1be4f288fad03..227e5aa5deca6 100644
--- a/python/pyspark/pipelines/init_cli.py
+++ b/python/pyspark/pipelines/init_cli.py
@@ -18,6 +18,7 @@
from pathlib import Path
SPEC = """
+name: {{ name }}
definitions:
- glob:
include: transformations/**/*.py
@@ -25,12 +26,12 @@
include: transformations/**/*.sql
"""
-PYTHON_EXAMPLE = """from pyspark import pipelines as sdp
+PYTHON_EXAMPLE = """from pyspark import pipelines as dp
from pyspark.sql import DataFrame, SparkSession
spark = SparkSession.active()
-@sdp.materialized_view
+@dp.materialized_view
def example_python_materialized_view() -> DataFrame:
return spark.range(10)
"""
@@ -49,7 +50,7 @@ def init(name: str) -> None:
# Write the spec file to the project directory
spec_file = project_dir / "pipeline.yml"
with open(spec_file, "w") as f:
- f.write(SPEC)
+ f.write(SPEC.replace("{{ name }}", name))
# Create the transformations directory
transformations_dir = project_dir / "transformations"
diff --git a/python/pyspark/pipelines/spark_connect_graph_element_registry.py b/python/pyspark/pipelines/spark_connect_graph_element_registry.py
index 8bc4aeefd2264..020c7989138d4 100644
--- a/python/pyspark/pipelines/spark_connect_graph_element_registry.py
+++ b/python/pyspark/pipelines/spark_connect_graph_element_registry.py
@@ -93,9 +93,8 @@ def register_flow(self, flow: Flow) -> None:
dataflow_graph_id=self._dataflow_graph_id,
flow_name=flow.name,
target_dataset_name=flow.target,
- plan=relation,
+ relation=relation,
sql_conf=flow.spark_conf,
- once=flow.once,
)
command = pb2.Command()
command.pipeline_command.define_flow.CopyFrom(inner_command)
diff --git a/python/pyspark/pipelines/spark_connect_pipeline.py b/python/pyspark/pipelines/spark_connect_pipeline.py
index 12f43a236c289..61b72956e5ccc 100644
--- a/python/pyspark/pipelines/spark_connect_pipeline.py
+++ b/python/pyspark/pipelines/spark_connect_pipeline.py
@@ -15,7 +15,7 @@
# limitations under the License.
#
from datetime import timezone
-from typing import Any, Dict, Mapping, Iterator, Optional, cast
+from typing import Any, Dict, Mapping, Iterator, Optional, cast, Sequence
import pyspark.sql.connect.proto as pb2
from pyspark.sql import SparkSession
@@ -65,12 +65,28 @@ def handle_pipeline_events(iter: Iterator[Dict[str, Any]]) -> None:
log_with_provided_timestamp(event.message, dt)
-def start_run(spark: SparkSession, dataflow_graph_id: str) -> Iterator[Dict[str, Any]]:
+def start_run(
+ spark: SparkSession,
+ dataflow_graph_id: str,
+ full_refresh: Optional[Sequence[str]],
+ full_refresh_all: bool,
+ refresh: Optional[Sequence[str]],
+ dry: bool,
+) -> Iterator[Dict[str, Any]]:
"""Start a run of the dataflow graph in the Spark Connect server.
:param dataflow_graph_id: The ID of the dataflow graph to start.
+ :param full_refresh: List of datasets to reset and recompute.
+ :param full_refresh_all: Perform a full graph reset and recompute.
+ :param refresh: List of datasets to update.
+ :param dry: If True, validate the graph and check for errors without executing the run.
"""
- inner_command = pb2.PipelineCommand.StartRun(dataflow_graph_id=dataflow_graph_id)
+ inner_command = pb2.PipelineCommand.StartRun(
+ dataflow_graph_id=dataflow_graph_id,
+ full_refresh_selection=full_refresh or [],
+ full_refresh_all=full_refresh_all,
+ refresh_selection=refresh or [],
+ dry=dry,
+ )
command = pb2.Command()
command.pipeline_command.start_run.CopyFrom(inner_command)
# Cast because mypy seems to think `spark`` is a function, not an object. Likely related to
diff --git a/python/pyspark/pipelines/tests/test_block_session_mutations.py b/python/pyspark/pipelines/tests/test_block_session_mutations.py
new file mode 100644
index 0000000000000..3384a5fcbfb35
--- /dev/null
+++ b/python/pyspark/pipelines/tests/test_block_session_mutations.py
@@ -0,0 +1,260 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import unittest
+
+from pyspark.errors import PySparkException
+from pyspark.sql.types import StringType
+from pyspark.testing.connectutils import (
+ ReusedConnectTestCase,
+ should_test_connect,
+ connect_requirement_message,
+)
+
+if should_test_connect:
+ from pyspark.pipelines.block_session_mutations import (
+ block_session_mutations,
+ BLOCKED_METHODS,
+ ERROR_CLASS,
+ )
+
+
+@unittest.skipIf(not should_test_connect, connect_requirement_message or "Connect not available")
+class BlockImperativeConfSetConnectTests(ReusedConnectTestCase):
+ def test_blocks_runtime_conf_set(self):
+ """Test that spark.conf.set() is blocked."""
+ config = self.spark.conf
+
+ test_cases = [
+ ("spark.test.string", "string_value"),
+ ("spark.test.int", 42),
+ ("spark.test.bool", True),
+ ]
+
+ for key, value in test_cases:
+ with self.subTest(key=key, value=value):
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ config.set(key, value)
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.SET_RUNTIME_CONF",
+ )
+ self.assertIn("'RuntimeConf.set'", str(context.exception))
+
+ def test_blocks_catalog_set_current_catalog(self):
+ """Test that spark.catalog.setCurrentCatalog() is blocked."""
+ catalog = self.spark.catalog
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ catalog.setCurrentCatalog("test_catalog")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.SET_CURRENT_CATALOG",
+ )
+ self.assertIn("'Catalog.setCurrentCatalog'", str(context.exception))
+
+ def test_blocks_catalog_set_current_database(self):
+ """Test that spark.catalog.setCurrentDatabase() is blocked."""
+ catalog = self.spark.catalog
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ catalog.setCurrentDatabase("test_db")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.SET_CURRENT_DATABASE",
+ )
+ self.assertIn("'Catalog.setCurrentDatabase'", str(context.exception))
+
+ def test_blocks_catalog_drop_temp_view(self):
+ """Test that spark.catalog.dropTempView() is blocked."""
+ catalog = self.spark.catalog
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ catalog.dropTempView("test_view")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.DROP_TEMP_VIEW",
+ )
+ self.assertIn("'Catalog.dropTempView'", str(context.exception))
+
+ def test_blocks_catalog_drop_global_temp_view(self):
+ """Test that spark.catalog.dropGlobalTempView() is blocked."""
+ catalog = self.spark.catalog
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ catalog.dropGlobalTempView("test_view")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.DROP_GLOBAL_TEMP_VIEW",
+ )
+ self.assertIn("'Catalog.dropGlobalTempView'", str(context.exception))
+
+ def test_blocks_dataframe_create_temp_view(self):
+ """Test that DataFrame.createTempView() is blocked."""
+ df = self.spark.range(1)
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ df.createTempView("test_view")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.CREATE_TEMP_VIEW",
+ )
+ self.assertIn("'DataFrame.createTempView'", str(context.exception))
+
+ def test_blocks_dataframe_create_or_replace_temp_view(self):
+ """Test that DataFrame.createOrReplaceTempView() is blocked."""
+ df = self.spark.range(1)
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ df.createOrReplaceTempView("test_view")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.CREATE_OR_REPLACE_TEMP_VIEW",
+ )
+ self.assertIn("'DataFrame.createOrReplaceTempView'", str(context.exception))
+
+ def test_blocks_dataframe_create_global_temp_view(self):
+ """Test that DataFrame.createGlobalTempView() is blocked."""
+ df = self.spark.range(1)
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ df.createGlobalTempView("test_view")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.CREATE_GLOBAL_TEMP_VIEW",
+ )
+ self.assertIn("'DataFrame.createGlobalTempView'", str(context.exception))
+
+ def test_blocks_dataframe_create_or_replace_global_temp_view(self):
+ """Test that DataFrame.createOrReplaceGlobalTempView() is blocked."""
+ df = self.spark.range(1)
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ df.createOrReplaceGlobalTempView("test_view")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.CREATE_OR_REPLACE_GLOBAL_TEMP_VIEW",
+ )
+ self.assertIn("'DataFrame.createOrReplaceGlobalTempView'", str(context.exception))
+
+ def test_blocks_udf_register(self):
+ """Test that spark.udf.register() is blocked."""
+ udf_registry = self.spark.udf
+
+ def test_func(x):
+ return x + 1
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ udf_registry.register("test_udf", test_func, StringType())
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.REGISTER_UDF",
+ )
+ self.assertIn("'UDFRegistration.register'", str(context.exception))
+
+ def test_blocks_udf_register_java_function(self):
+ """Test that spark.udf.registerJavaFunction() is blocked."""
+ udf_registry = self.spark.udf
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ udf_registry.registerJavaFunction(
+ "test_java_udf", "com.example.TestUDF", StringType()
+ )
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.REGISTER_JAVA_UDF",
+ )
+ self.assertIn("'UDFRegistration.registerJavaFunction'", str(context.exception))
+
+ def test_blocks_udf_register_java_udaf(self):
+ """Test that spark.udf.registerJavaUDAF() is blocked."""
+ udf_registry = self.spark.udf
+
+ with block_session_mutations():
+ with self.assertRaises(PySparkException) as context:
+ udf_registry.registerJavaUDAF("test_java_udaf", "com.example.TestUDAF")
+
+ self.assertEqual(
+ context.exception.getCondition(),
+ f"{ERROR_CLASS}.REGISTER_JAVA_UDAF",
+ )
+ self.assertIn("'UDFRegistration.registerJavaUDAF'", str(context.exception))
+
+ def test_restores_original_methods_after_context(self):
+ """Test that all methods are properly restored after context manager exits."""
+ # Store original methods
+ original_methods = {}
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ original_methods[(cls, method_name)] = getattr(cls, method_name)
+
+ # Verify methods are originally set correctly
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ with self.subTest(class_method=f"{cls.__name__}.{method_name}"):
+ self.assertIs(getattr(cls, method_name), original_methods[(cls, method_name)])
+
+ # Verify methods are replaced during context
+ with block_session_mutations():
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ with self.subTest(class_method=f"{cls.__name__}.{method_name}"):
+ self.assertIsNot(
+ getattr(cls, method_name), original_methods[(cls, method_name)]
+ )
+
+ # Verify methods are restored after context
+ for method_info in BLOCKED_METHODS:
+ cls = method_info["class"]
+ method_name = method_info["method"]
+ with self.subTest(class_method=f"{cls.__name__}.{method_name}"):
+ self.assertIs(getattr(cls, method_name), original_methods[(cls, method_name)])
+
+
+if __name__ == "__main__":
+ try:
+ import xmlrunner # type: ignore
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/pipelines/tests/test_cli.py b/python/pyspark/pipelines/tests/test_cli.py
index 92de53029f78b..8055723ddc5ae 100644
--- a/python/pyspark/pipelines/tests/test_cli.py
+++ b/python/pyspark/pipelines/tests/test_cli.py
@@ -36,6 +36,7 @@
unpack_pipeline_spec,
DefinitionsGlob,
PipelineSpec,
+ run,
)
from pyspark.pipelines.tests.local_graph_element_registry import LocalGraphElementRegistry
@@ -50,6 +51,7 @@ def test_load_pipeline_spec(self):
tmpfile.write(
"""
{
+ "name": "test_pipeline",
"catalog": "test_catalog",
"database": "test_database",
"configuration": {
@@ -64,17 +66,44 @@ def test_load_pipeline_spec(self):
)
tmpfile.flush()
spec = load_pipeline_spec(Path(tmpfile.name))
+ assert spec.name == "test_pipeline"
assert spec.catalog == "test_catalog"
assert spec.database == "test_database"
assert spec.configuration == {"key1": "value1", "key2": "value2"}
assert len(spec.definitions) == 1
assert spec.definitions[0].include == "test_include"
+ def test_load_pipeline_spec_name_is_required(self):
+ with tempfile.NamedTemporaryFile(mode="w") as tmpfile:
+ tmpfile.write(
+ """
+ {
+ "catalog": "test_catalog",
+ "database": "test_database",
+ "configuration": {
+ "key1": "value1",
+ "key2": "value2"
+ },
+ "definitions": [
+ {"glob": {"include": "test_include"}}
+ ]
+ }
+ """
+ )
+ tmpfile.flush()
+ with self.assertRaises(PySparkException) as context:
+ load_pipeline_spec(Path(tmpfile.name))
+ self.assertEqual(
+ context.exception.getCondition(), "PIPELINE_SPEC_MISSING_REQUIRED_FIELD"
+ )
+ self.assertEqual(context.exception.getMessageParameters(), {"field_name": "name"})
+
def test_load_pipeline_spec_schema_fallback(self):
with tempfile.NamedTemporaryFile(mode="w") as tmpfile:
tmpfile.write(
"""
{
+ "name": "test_pipeline",
"catalog": "test_catalog",
"schema": "test_database",
"configuration": {
@@ -120,20 +149,22 @@ def test_load_pipeline_spec_invalid(self):
)
def test_unpack_empty_pipeline_spec(self):
- empty_spec = PipelineSpec(catalog=None, database=None, configuration={}, definitions=[])
- self.assertEqual(unpack_pipeline_spec({}), empty_spec)
+ empty_spec = PipelineSpec(
+ name="test_pipeline", catalog=None, database=None, configuration={}, definitions=[]
+ )
+ self.assertEqual(unpack_pipeline_spec({"name": "test_pipeline"}), empty_spec)
def test_unpack_pipeline_spec_bad_configuration(self):
with self.assertRaises(TypeError) as context:
- unpack_pipeline_spec({"configuration": "not_a_dict"})
+ unpack_pipeline_spec({"name": "test_pipeline", "configuration": "not_a_dict"})
self.assertIn("should be a dict", str(context.exception))
with self.assertRaises(TypeError) as context:
- unpack_pipeline_spec({"configuration": {"key": {}}})
+ unpack_pipeline_spec({"name": "test_pipeline", "configuration": {"key": {}}})
self.assertIn("key", str(context.exception))
with self.assertRaises(TypeError) as context:
- unpack_pipeline_spec({"configuration": {1: "something"}})
+ unpack_pipeline_spec({"name": "test_pipeline", "configuration": {1: "something"}})
self.assertIn("int", str(context.exception))
def test_find_pipeline_spec_in_current_directory(self):
@@ -205,6 +236,7 @@ def test_find_pipeline_spec_in_parent_directory(self):
def test_register_definitions(self):
spec = PipelineSpec(
+ name="test_pipeline",
catalog=None,
database=None,
configuration={},
@@ -220,8 +252,8 @@ def test_register_definitions(self):
f.write(
textwrap.dedent(
"""
- from pyspark import pipelines as sdp
- @sdp.materialized_view
+ from pyspark import pipelines as dp
+ @dp.materialized_view
def mv1():
raise NotImplementedError()
"""
@@ -232,7 +264,7 @@ def mv1():
f.write(
textwrap.dedent(
"""
- from pyspark import pipelines as sdp
+ from pyspark import pipelines as dp
def mv2():
raise NotImplementedError()
"""
@@ -247,6 +279,7 @@ def mv2():
def test_register_definitions_file_raises_error(self):
"""Errors raised while executing definitions code should make it to the outer context."""
spec = PipelineSpec(
+ name="test_pipeline",
catalog=None,
database=None,
configuration={},
@@ -264,6 +297,7 @@ def test_register_definitions_file_raises_error(self):
def test_register_definitions_unsupported_file_extension_matches_glob(self):
spec = PipelineSpec(
+ name="test_pipeline",
catalog=None,
database=None,
configuration={},
@@ -317,6 +351,7 @@ def test_python_import_current_directory(self):
inner_dir1 / "pipeline.yaml",
registry,
PipelineSpec(
+ name="test_pipeline",
catalog=None,
database=None,
configuration={},
@@ -324,6 +359,98 @@ def test_python_import_current_directory(self):
),
)
+ def test_full_refresh_all_conflicts_with_full_refresh(self):
+ with tempfile.TemporaryDirectory() as temp_dir:
+ # Create a minimal pipeline spec
+ spec_path = Path(temp_dir) / "pipeline.yaml"
+ with spec_path.open("w") as f:
+ f.write('{"name": "test_pipeline"}')
+
+ # Test that providing both --full-refresh-all and --full-refresh raises an exception
+ with self.assertRaises(PySparkException) as context:
+ run(
+ spec_path=spec_path,
+ full_refresh=["table1", "table2"],
+ full_refresh_all=True,
+ refresh=[],
+ dry=False,
+ )
+
+ self.assertEqual(
+ context.exception.getCondition(), "CONFLICTING_PIPELINE_REFRESH_OPTIONS"
+ )
+ self.assertEqual(
+ context.exception.getMessageParameters(), {"conflicting_option": "--full_refresh"}
+ )
+
+ def test_full_refresh_all_conflicts_with_refresh(self):
+ with tempfile.TemporaryDirectory() as temp_dir:
+ # Create a minimal pipeline spec
+ spec_path = Path(temp_dir) / "pipeline.yaml"
+ with spec_path.open("w") as f:
+ f.write('{"name": "test_pipeline"}')
+
+ # Test that providing both --full-refresh-all and --refresh raises an exception
+ with self.assertRaises(PySparkException) as context:
+ run(
+ spec_path=spec_path,
+ full_refresh=[],
+ full_refresh_all=True,
+ refresh=["table1", "table2"],
+ dry=False,
+ )
+
+ self.assertEqual(
+ context.exception.getCondition(), "CONFLICTING_PIPELINE_REFRESH_OPTIONS"
+ )
+ self.assertEqual(
+ context.exception.getMessageParameters(),
+ {"conflicting_option": "--refresh"},
+ )
+
+ def test_full_refresh_all_conflicts_with_both(self):
+ with tempfile.TemporaryDirectory() as temp_dir:
+ # Create a minimal pipeline spec
+ spec_path = Path(temp_dir) / "pipeline.yaml"
+ with spec_path.open("w") as f:
+ f.write('{"name": "test_pipeline"}')
+
+ # Test that providing --full-refresh-all with both other options raises an exception
+ # (it should catch the first conflict - full_refresh)
+ with self.assertRaises(PySparkException) as context:
+ run(
+ spec_path=spec_path,
+ full_refresh=["table1"],
+ full_refresh_all=True,
+ refresh=["table2"],
+ dry=False,
+ )
+
+ self.assertEqual(
+ context.exception.getCondition(), "CONFLICTING_PIPELINE_REFRESH_OPTIONS"
+ )
+
+ def test_parse_table_list_single_table(self):
+ """Test parsing a single table name."""
+ from pyspark.pipelines.cli import parse_table_list
+
+ result = parse_table_list("table1")
+ self.assertEqual(result, ["table1"])
+
+ def test_parse_table_list_multiple_tables(self):
+ """Test parsing multiple table names."""
+ from pyspark.pipelines.cli import parse_table_list
+
+ result = parse_table_list("table1,table2,table3")
+ self.assertEqual(result, ["table1", "table2", "table3"])
+
+ def test_parse_table_list_with_spaces(self):
+ """Test parsing table names with spaces."""
+ from pyspark.pipelines.cli import parse_table_list
+
+ result = parse_table_list("table1, table2 , table3")
+ self.assertEqual(result, ["table1", "table2", "table3"])
+
if __name__ == "__main__":
try:
diff --git a/python/pyspark/pipelines/tests/test_decorators.py b/python/pyspark/pipelines/tests/test_decorators.py
index ac575b43d1090..31a966da164d1 100644
--- a/python/pyspark/pipelines/tests/test_decorators.py
+++ b/python/pyspark/pipelines/tests/test_decorators.py
@@ -18,12 +18,12 @@
import unittest
from pyspark.errors import PySparkTypeError
-from pyspark import pipelines as sdp
+from pyspark import pipelines as dp
class DecoratorsTest(unittest.TestCase):
def test_dataset_name_not_string(self):
- for decorator in [sdp.table, sdp.temporary_view, sdp.materialized_view]:
+ for decorator in [dp.table, dp.temporary_view, dp.materialized_view]:
with self.assertRaises(PySparkTypeError) as context:
@decorator(name=5)
@@ -37,7 +37,7 @@ def dataset_with_non_string_name():
}, context.exception.getMessageParameters()
def test_invalid_partition_cols(self):
- for decorator in [sdp.table, sdp.materialized_view]:
+ for decorator in [dp.table, dp.materialized_view]:
with self.assertRaises(PySparkTypeError) as context:
@decorator(partition_cols=["a", 1, 2]) # type: ignore
@@ -51,7 +51,7 @@ def dataset_with_invalid_partition_cols():
}, context.exception.getMessageParameters()
def test_decorator_with_positional_arg(self):
- for decorator in [sdp.table, sdp.temporary_view, sdp.materialized_view]:
+ for decorator in [dp.table, dp.temporary_view, dp.materialized_view]:
with self.assertRaises(PySparkTypeError) as context:
decorator("table1")
diff --git a/python/pyspark/pipelines/tests/test_graph_element_registry.py b/python/pyspark/pipelines/tests/test_graph_element_registry.py
index 9ebf29d1ed47b..2f9d2c69b7d5c 100644
--- a/python/pyspark/pipelines/tests/test_graph_element_registry.py
+++ b/python/pyspark/pipelines/tests/test_graph_element_registry.py
@@ -19,7 +19,7 @@
from pyspark.errors import PySparkException
from pyspark.pipelines.graph_element_registry import graph_element_registration_context
-from pyspark import pipelines as sdp
+from pyspark import pipelines as dp
from pyspark.pipelines.tests.local_graph_element_registry import LocalGraphElementRegistry
@@ -28,21 +28,21 @@ def test_graph_element_registry(self):
registry = LocalGraphElementRegistry()
with graph_element_registration_context(registry):
- @sdp.materialized_view
+ @dp.materialized_view
def mv():
raise NotImplementedError()
- @sdp.table
+ @dp.table
def st():
raise NotImplementedError()
- sdp.create_streaming_table("st2")
+ dp.create_streaming_table("st2")
- @sdp.append_flow(target="st2", once=True)
+ @dp.append_flow(target="st2")
def flow1():
raise NotImplementedError()
- @sdp.append_flow(target="st2", once=False)
+ @dp.append_flow(target="st2")
def flow2():
raise NotImplementedError()
@@ -74,17 +74,15 @@ def flow2():
st2_flow1_obj = registry.flows[2]
self.assertEqual(st2_flow1_obj.name, "flow1")
self.assertEqual(st2_flow1_obj.target, "st2")
- self.assertEqual(st2_flow1_obj.once, True)
assert mv_flow_obj.source_code_location.filename.endswith("test_graph_element_registry.py")
st2_flow1_obj = registry.flows[3]
self.assertEqual(st2_flow1_obj.name, "flow2")
self.assertEqual(st2_flow1_obj.target, "st2")
- self.assertEqual(st2_flow1_obj.once, False)
assert mv_flow_obj.source_code_location.filename.endswith("test_graph_element_registry.py")
def test_definition_without_graph_element_registry(self):
- for decorator in [sdp.table, sdp.temporary_view, sdp.materialized_view]:
+ for decorator in [dp.table, dp.temporary_view, dp.materialized_view]:
with self.assertRaises(PySparkException) as context:
@decorator
@@ -97,7 +95,7 @@ def a():
)
with self.assertRaises(PySparkException) as context:
- sdp.create_streaming_table("st")
+ dp.create_streaming_table("st")
self.assertEqual(
context.exception.getCondition(),
@@ -106,7 +104,7 @@ def a():
with self.assertRaises(PySparkException) as context:
- @sdp.append_flow(target="st")
+ @dp.append_flow(target="st")
def b():
raise NotImplementedError()
diff --git a/python/pyspark/pipelines/tests/test_init_cli.py b/python/pyspark/pipelines/tests/test_init_cli.py
index 656e4b609eaa2..f2390853d0f3e 100644
--- a/python/pyspark/pipelines/tests/test_init_cli.py
+++ b/python/pyspark/pipelines/tests/test_init_cli.py
@@ -50,6 +50,7 @@ def test_init(self):
with change_dir(Path(temp_dir) / project_name):
spec_path = find_pipeline_spec(Path.cwd())
spec = load_pipeline_spec(spec_path)
+ assert spec.name == project_name
registry = LocalGraphElementRegistry()
register_definitions(spec_path, registry, spec)
self.assertEqual(len(registry.datasets), 1)
diff --git a/python/pyspark/pipelines/tests/test_spark_connect.py b/python/pyspark/pipelines/tests/test_spark_connect.py
new file mode 100644
index 0000000000000..6d81a98c8c44d
--- /dev/null
+++ b/python/pyspark/pipelines/tests/test_spark_connect.py
@@ -0,0 +1,97 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+"""
+Tests that run Pipelines against a Spark Connect server.
+"""
+
+import unittest
+
+from pyspark.errors.exceptions.connect import AnalysisException
+from pyspark.pipelines.graph_element_registry import graph_element_registration_context
+from pyspark.pipelines.spark_connect_graph_element_registry import (
+ SparkConnectGraphElementRegistry,
+)
+from pyspark.pipelines.spark_connect_pipeline import (
+ create_dataflow_graph,
+ start_run,
+ handle_pipeline_events,
+)
+from pyspark import pipelines as dp
+from pyspark.testing.connectutils import (
+ ReusedConnectTestCase,
+ should_test_connect,
+ connect_requirement_message,
+)
+
+
+@unittest.skipIf(not should_test_connect, connect_requirement_message)
+class SparkConnectPipelinesTest(ReusedConnectTestCase):
+ def test_dry_run(self):
+ dataflow_graph_id = create_dataflow_graph(self.spark, None, None, None)
+ registry = SparkConnectGraphElementRegistry(self.spark, dataflow_graph_id)
+
+ with graph_element_registration_context(registry):
+
+ @dp.materialized_view
+ def mv():
+ return self.spark.range(1)
+
+ result_iter = start_run(
+ self.spark,
+ dataflow_graph_id,
+ full_refresh=None,
+ refresh=None,
+ full_refresh_all=False,
+ dry=True,
+ )
+ handle_pipeline_events(result_iter)
+
+ def test_dry_run_failure(self):
+ dataflow_graph_id = create_dataflow_graph(self.spark, None, None, None)
+ registry = SparkConnectGraphElementRegistry(self.spark, dataflow_graph_id)
+
+ with graph_element_registration_context(registry):
+
+ @dp.table
+ def st():
+ # Invalid because a streaming query is expected
+ return self.spark.range(1)
+
+ result_iter = start_run(
+ self.spark,
+ dataflow_graph_id,
+ full_refresh=None,
+ refresh=None,
+ full_refresh_all=False,
+ dry=True,
+ )
+ with self.assertRaises(AnalysisException) as context:
+ handle_pipeline_events(result_iter)
+ self.assertIn(
+ "INVALID_FLOW_QUERY_TYPE.BATCH_RELATION_FOR_STREAMING_TABLE", str(context.exception)
+ )
+
+
+if __name__ == "__main__":
+ try:
+ import xmlrunner # type: ignore
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/_typing.pyi b/python/pyspark/sql/_typing.pyi
index 27fa0f2a90133..fafc9bdf15fc5 100644
--- a/python/pyspark/sql/_typing.pyi
+++ b/python/pyspark/sql/_typing.pyi
@@ -65,6 +65,7 @@ SQLBatchedUDFType = Literal[100]
SQLArrowBatchedUDFType = Literal[101]
SQLTableUDFType = Literal[300]
SQLArrowTableUDFType = Literal[301]
+SQLArrowUDTFType = Literal[302]
class SupportsOpen(Protocol):
def open(self, partition_id: int, epoch_id: int) -> bool: ...
diff --git a/python/pyspark/sql/classic/dataframe.py b/python/pyspark/sql/classic/dataframe.py
index f72c066a65723..722f0615b370a 100644
--- a/python/pyspark/sql/classic/dataframe.py
+++ b/python/pyspark/sql/classic/dataframe.py
@@ -207,7 +207,7 @@ def schema(self) -> StructType:
except Exception as e:
raise PySparkValueError(
errorClass="CANNOT_PARSE_DATATYPE",
- messageParameters={"error": str(e)},
+ messageParameters={"msg": str(e)},
)
def printSchema(self, level: Optional[int] = None) -> None:
diff --git a/python/pyspark/sql/connect/client/core.py b/python/pyspark/sql/connect/client/core.py
index 34719f2b0ba6e..9d2e18ebb7600 100644
--- a/python/pyspark/sql/connect/client/core.py
+++ b/python/pyspark/sql/connect/client/core.py
@@ -63,7 +63,6 @@
from pyspark.util import is_remote_only
from pyspark.accumulators import SpecialAccumulatorIds
-from pyspark.loose_version import LooseVersion
from pyspark.version import __version__
from pyspark.resource.information import ResourceInformation
from pyspark.sql.metrics import MetricValue, PlanMetrics, ExecutionInfo, ObservedMetrics
@@ -109,6 +108,7 @@
if TYPE_CHECKING:
from google.rpc.error_details_pb2 import ErrorInfo
from pyspark.sql.connect._typing import DataTypeOrString
+ from pyspark.sql.connect.session import SparkSession
from pyspark.sql.datasource import DataSource
@@ -606,6 +606,7 @@ def __init__(
channel_options: Optional[List[Tuple[str, Any]]] = None,
retry_policy: Optional[Dict[str, Any]] = None,
use_reattachable_execute: bool = True,
+ session_hooks: Optional[list["SparkSession.Hook"]] = None,
):
"""
Creates a new SparkSession for the Spark Connect interface.
@@ -636,6 +637,8 @@ def __init__(
a failed request. Default: 60000(ms).
use_reattachable_execute: bool
Enable reattachable execution.
+ session_hooks: list[SparkSession.Hook], optional
+ List of session hooks to call.
"""
self.thread_local = threading.local()
@@ -675,6 +678,7 @@ def __init__(
self._user_id, self._session_id, self._channel, self._builder.metadata()
)
self._use_reattachable_execute = use_reattachable_execute
+ self._session_hooks = session_hooks or []
# Configure logging for the SparkConnect client.
# Capture the server-side session ID and set it to None initially. It will
@@ -963,7 +967,7 @@ def to_pandas(
# Rename columns to avoid duplicated column names.
renamed_table = table.rename_columns([f"col_{i}" for i in range(table.num_columns)])
- pandas_options = {}
+ pandas_options = {"coerce_temporal_nanoseconds": True}
if self_destruct:
# Configure PyArrow to use as little memory as possible:
# self_destruct - free columns as they are converted
@@ -976,15 +980,6 @@ def to_pandas(
"use_threads": False,
}
)
- if LooseVersion(pa.__version__) >= LooseVersion("13.0.0"):
- # A legacy option to coerce date32, date64, duration, and timestamp
- # time units to nanoseconds when converting to pandas.
- # This option can only be added since 13.0.0.
- pandas_options.update(
- {
- "coerce_temporal_nanoseconds": True,
- }
- )
pdf = renamed_table.to_pandas(**pandas_options)
pdf.columns = schema.names
@@ -1365,6 +1360,9 @@ def _execute(self, req: pb2.ExecutePlanRequest) -> None:
"""
logger.debug("Execute")
+ for hook in self._session_hooks:
+ req = hook.on_execute_plan(req)
+
def handle_response(b: pb2.ExecutePlanResponse) -> None:
self._verify_response_integrity(b)
@@ -1406,6 +1404,9 @@ def _execute_and_fetch_as_iterator(
# when not at debug log level.
logger.debug(f"ExecuteAndFetchAsIterator. Request: {self._proto_to_string(req)}")
+ for hook in self._session_hooks:
+ req = hook.on_execute_plan(req)
+
num_records = 0
def handle_response(
@@ -1985,7 +1986,7 @@ def _create_profile(self, profile: pb2.ResourceProfile) -> int:
profile_id = properties["create_resource_profile_command_result"]
return profile_id
- def _delete_ml_cache(self, cache_ids: List[str]) -> List[str]:
+ def _delete_ml_cache(self, cache_ids: List[str], evict_only: bool = False) -> List[str]:
# try best to delete the cache
try:
if len(cache_ids) > 0:
@@ -1993,6 +1994,7 @@ def _delete_ml_cache(self, cache_ids: List[str]) -> List[str]:
command.ml_command.delete.obj_refs.extend(
[pb2.ObjectRef(id=cache_id) for cache_id in cache_ids]
)
+ command.ml_command.delete.evict_only = evict_only
(_, properties, _) = self.execute_command(command)
assert properties is not None
@@ -2025,3 +2027,15 @@ def _get_ml_cache_info(self) -> List[str]:
return [item.string for item in ml_command_result.param.array.elements]
return []
+
+ def _query_model_size(self, model_ref_id: str) -> int:
+ command = pb2.Command()
+ command.ml_command.get_model_size.CopyFrom(
+ pb2.MlCommand.GetModelSize(model_ref=pb2.ObjectRef(id=model_ref_id))
+ )
+ (_, properties, _) = self.execute_command(command)
+
+ assert properties is not None
+
+ ml_command_result = properties["ml_command_result"]
+ return ml_command_result.param.long
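The session-hooks change above lets callers pass objects whose on_execute_plan method sees (and may rewrite) every ExecutePlanRequest before it is sent. A minimal sketch of such a hook, assuming only the contract visible in the hunks above; the class name, the print statement, and the wiring comment are illustrative, not part of the Spark API:

import pyspark.sql.connect.proto as pb2


class LoggingHook:  # hypothetical example, not a real Spark class
    def on_execute_plan(self, req: pb2.ExecutePlanRequest) -> pb2.ExecutePlanRequest:
        # Inspect or tag the request before the client sends it to the server.
        print(f"Executing plan for session {req.session_id}")
        return req


# Hypothetical wiring: SparkConnectClient(..., session_hooks=[LoggingHook()]).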
diff --git a/python/pyspark/sql/connect/client/reattach.py b/python/pyspark/sql/connect/client/reattach.py
index 78b783371ab56..06a4fe17c29f9 100644
--- a/python/pyspark/sql/connect/client/reattach.py
+++ b/python/pyspark/sql/connect/client/reattach.py
@@ -79,8 +79,9 @@ def shutdown(cls: Type["ExecutePlanResponseReattachableIterator"]) -> None:
"""
with cls._lock:
if cls._release_thread_pool_instance is not None:
- cls._get_or_create_release_thread_pool().shutdown()
+ thread_pool = cls._release_thread_pool_instance
cls._release_thread_pool_instance = None
+ thread_pool.shutdown()
def __init__(
self,
diff --git a/python/pyspark/sql/connect/client/retries.py b/python/pyspark/sql/connect/client/retries.py
index e27100133b5ae..898d976f2628e 100644
--- a/python/pyspark/sql/connect/client/retries.py
+++ b/python/pyspark/sql/connect/client/retries.py
@@ -19,10 +19,13 @@
import random
import time
import typing
-from typing import Optional, Callable, Generator, List, Type
+import warnings
+from google.rpc import error_details_pb2
+from grpc_status import rpc_status
+from typing import Optional, Callable, Generator, List, Type, cast
from types import TracebackType
from pyspark.sql.connect.logging import logger
-from pyspark.errors import PySparkRuntimeError, RetriesExceeded
+from pyspark.errors import PySparkRuntimeError
"""
This module contains retry system. The system is designed to be
@@ -45,6 +48,34 @@ class RetryPolicy:
Describes key aspects of RetryPolicy.
It's advised that different policies are implemented as different subclasses.
+
+ Parameters
+ ----------
+ max_retries: int, optional
+ Maximum number of retries.
+ initial_backoff: int
+ Start value of the exponential backoff.
+ max_backoff: int, optional
+ Maximal value of the exponential backoff.
+ backoff_multiplier: float
+ Multiplicative base of the exponential backoff.
+ jitter: int
+ Sample a random value uniformly from the range [0, jitter] and add it to the backoff.
+ min_jitter_threshold: int
+ Minimal value of the backoff to add random jitter.
+ recognize_server_retry_delay: bool
+ Per the gRPC standard, the server can send error messages that contain a `RetryInfo` message
+ with a `retry_delay` field, indicating that the client should wait at least `retry_delay`
+ before retrying again, see:
+ https://github.com/googleapis/googleapis/blob/master/google/rpc/error_details.proto#L91
+
+ If this flag is set to true, RetryPolicy will use `RetryInfo.retry_delay` field
+ in the backoff computation. Server's `retry_delay` can override client's `max_backoff`.
+
+ This flag does not change which errors are retried, only how the backoff is computed.
+ `DefaultPolicy` additionally has a rule for retrying any error that contains `RetryInfo`.
+ max_server_retry_delay: int, optional
+ Limit for the server-provided `retry_delay`.
"""
def __init__(
@@ -55,6 +86,8 @@ def __init__(
backoff_multiplier: float = 1.0,
jitter: int = 0,
min_jitter_threshold: int = 0,
+ recognize_server_retry_delay: bool = False,
+ max_server_retry_delay: Optional[int] = None,
):
self.max_retries = max_retries
self.initial_backoff = initial_backoff
@@ -62,6 +95,8 @@ def __init__(
self.backoff_multiplier = backoff_multiplier
self.jitter = jitter
self.min_jitter_threshold = min_jitter_threshold
+ self.recognize_server_retry_delay = recognize_server_retry_delay
+ self.max_server_retry_delay = max_server_retry_delay
self._name = self.__class__.__name__
@property
@@ -98,7 +133,7 @@ def name(self) -> str:
def can_retry(self, exception: BaseException) -> bool:
return self.policy.can_retry(exception)
- def next_attempt(self) -> Optional[int]:
+ def next_attempt(self, exception: Optional[BaseException] = None) -> Optional[int]:
"""
Returns
-------
@@ -119,6 +154,14 @@ def next_attempt(self) -> Optional[int]:
float(self.policy.max_backoff), wait_time * self.policy.backoff_multiplier
)
+ if exception is not None and self.policy.recognize_server_retry_delay:
+ retry_delay = extract_retry_delay(exception)
+ if retry_delay is not None:
+ logger.debug(f"The server has sent a retry delay of {retry_delay} ms.")
+ if self.policy.max_server_retry_delay is not None:
+ retry_delay = min(retry_delay, self.policy.max_server_retry_delay)
+ wait_time = max(wait_time, retry_delay)
+
# Jitter current backoff, after the future backoff was computed
if wait_time >= self.policy.min_jitter_threshold:
wait_time += random.uniform(0, self.policy.jitter)
@@ -160,6 +203,7 @@ class Retrying:
This class is a point of entry into the retry logic.
The class accepts a list of retry policies and applies them in given order.
The first policy accepting an exception will be used.
+ Once one policy matches the error, the remaining policies are skipped.
The usage of the class should be as follows:
for attempt in Retrying(...):
@@ -167,7 +211,7 @@ class Retrying:
Do something that can throw exception
In case error is considered retriable, it would be retried based on policies, and
- RetriesExceeded will be raised if the retries limit would exceed.
+ the original exception will be re-raised once the retry limit is exceeded.
Exceptions not considered retriable will be passed through transparently.
"""
@@ -217,23 +261,25 @@ def _wait(self) -> None:
return
# Attempt to find a policy to wait with
+ matched_policy = None
for policy in self._policies:
- if not policy.can_retry(exception):
- continue
-
- wait_time = policy.next_attempt()
+ if policy.can_retry(exception):
+ matched_policy = policy
+ break
+ if matched_policy is not None:
+ wait_time = matched_policy.next_attempt(exception)
if wait_time is not None:
logger.debug(
f"Got error: {repr(exception)}. "
- + f"Will retry after {wait_time} ms (policy: {policy.name})"
+ + f"Will retry after {wait_time} ms (policy: {matched_policy.name})"
)
-
self._sleep(wait_time / 1000)
return
# Exceeded retries
logger.debug(f"Given up on retrying. error: {repr(exception)}")
- raise RetriesExceeded(errorClass="RETRIES_EXCEEDED", messageParameters={}) from exception
+ warnings.warn("[RETRIES_EXCEEDED] The maximum number of retries has been exceeded.")
+ raise exception
def __iter__(self) -> Generator[AttemptManager, None, None]:
"""
@@ -274,6 +320,8 @@ def __init__(
max_backoff: Optional[int] = 60000,
jitter: int = 500,
min_jitter_threshold: int = 2000,
+ recognize_server_retry_delay: bool = True,
+ max_server_retry_delay: Optional[int] = 10 * 60 * 1000, # 10 minutes
):
super().__init__(
max_retries=max_retries,
@@ -282,6 +330,8 @@ def __init__(
max_backoff=max_backoff,
jitter=jitter,
min_jitter_threshold=min_jitter_threshold,
+ recognize_server_retry_delay=recognize_server_retry_delay,
+ max_server_retry_delay=max_server_retry_delay,
)
def can_retry(self, e: BaseException) -> bool:
@@ -314,4 +364,29 @@ def can_retry(self, e: BaseException) -> bool:
if e.code() == grpc.StatusCode.UNAVAILABLE:
return True
+ if extract_retry_info(e) is not None:
+ # All error messages containing `RetryInfo` should be retried.
+ return True
+
return False
+
+
+def extract_retry_info(exception: BaseException) -> Optional[error_details_pb2.RetryInfo]:
+ """Extract and return RetryInfo from the grpc.RpcError"""
+ if isinstance(exception, grpc.RpcError):
+ status = rpc_status.from_call(cast(grpc.Call, exception))
+ if status:
+ for d in status.details:
+ if d.Is(error_details_pb2.RetryInfo.DESCRIPTOR):
+ info = error_details_pb2.RetryInfo()
+ d.Unpack(info)
+ return info
+ return None
+
+
+def extract_retry_delay(exception: BaseException) -> Optional[int]:
+ """Extract and return RetryInfo.retry_delay in milliseconds from grpc.RpcError if present."""
+ retry_info = extract_retry_info(exception)
+ if retry_info is not None:
+ return retry_info.retry_delay.ToMilliseconds()
+ return None
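To make the backoff rules documented in the RetryPolicy docstring above concrete, here is a standalone sketch (not the actual implementation) of how the client-side exponential backoff interacts with a server-provided retry_delay. The initial_backoff and backoff_multiplier values are assumed for illustration; only max_backoff and max_server_retry_delay come from the DefaultPolicy arguments shown above.

def sketch_wait_time(attempt: int, server_retry_delay_ms: int = 0) -> float:
    initial_backoff = 50                      # assumed for illustration
    backoff_multiplier = 4.0                  # assumed for illustration
    max_backoff = 60_000                      # DefaultPolicy argument shown above
    max_server_retry_delay = 10 * 60 * 1000   # 10 minutes, as above

    # Client-side exponential backoff, capped at max_backoff.
    wait = min(float(max_backoff), initial_backoff * backoff_multiplier ** attempt)
    if server_retry_delay_ms:
        # The server's retry_delay (capped at max_server_retry_delay) can push
        # the wait above max_backoff, per the docstring above.
        wait = max(wait, min(server_retry_delay_ms, max_server_retry_delay))
    return wait  # jitter is added on top once the wait exceeds min_jitter_threshold


# e.g. sketch_wait_time(3) == 3200.0, while a server delay of 120_000 ms
# overrides the client cap: sketch_wait_time(3, 120_000) == 120000.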
diff --git a/python/pyspark/sql/connect/dataframe.py b/python/pyspark/sql/connect/dataframe.py
index 101ae06f10edc..7998167976026 100644
--- a/python/pyspark/sql/connect/dataframe.py
+++ b/python/pyspark/sql/connect/dataframe.py
@@ -22,6 +22,7 @@
PySparkAttributeError,
)
from pyspark.resource import ResourceProfile
+from pyspark.sql.connect.logging import logger
from pyspark.sql.connect.utils import check_dependencies
check_dependencies(__name__)
@@ -43,6 +44,7 @@
)
import copy
+import os
import sys
import random
import pyarrow as pa
@@ -69,6 +71,7 @@
PySparkRuntimeError,
)
from pyspark.util import PythonEvalType
+from pyspark.serializers import CPickleSerializer
from pyspark.storagelevel import StorageLevel
import pyspark.sql.connect.plan as plan
from pyspark.sql.conversion import ArrowTableToRowsConversion
@@ -141,6 +144,7 @@ def __init__(
# by __repr__ and _repr_html_ while eager evaluation opens.
self._support_repr_html = False
self._cached_schema: Optional[StructType] = None
+ self._cached_schema_serialized: Optional[bytes] = None
self._execution_info: Optional["ExecutionInfo"] = None
def __reduce__(self) -> Tuple:
@@ -1737,7 +1741,9 @@ def __getitem__(
# }
# validate the column name
- if not hasattr(self._session, "is_mock_session"):
+ if os.environ.get("PYSPARK_VALIDATE_COLUMN_NAME_LEGACY") == "1" and not hasattr(
+ self._session, "is_mock_session"
+ ):
from pyspark.sql.connect.types import verify_col_name
# Try best to verify the column name with cached schema
@@ -1836,11 +1842,24 @@ def _schema(self) -> StructType:
if self._cached_schema is None:
query = self._plan.to_proto(self._session.client)
self._cached_schema = self._session.client.schema(query)
+ try:
+ self._cached_schema_serialized = CPickleSerializer().dumps(self._schema)
+ except Exception as e:
+ logger.warn(f"DataFrame schema pickle dumps failed with exception: {e}.")
+ self._cached_schema_serialized = None
return self._cached_schema
@property
def schema(self) -> StructType:
- return copy.deepcopy(self._schema)
+ # Calling self._schema caches the schema and serializes it if it is not cached yet.
+ _schema = self._schema
+ if self._cached_schema_serialized is not None:
+ try:
+ return CPickleSerializer().loads(self._cached_schema_serialized)
+ except Exception as e:
+ logger.warn(f"DataFrame schema pickle loads failed with exception: {e}.")
+ # In case of pickle ser/de failure, fallback to deepcopy approach.
+ return copy.deepcopy(_schema)
@functools.cache
def isLocal(self) -> bool:
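The schema-caching change above keeps both the parsed StructType and a pickled copy of it; each schema access then unpickles the bytes to hand the caller an independent object, falling back to copy.deepcopy when pickling fails. A minimal sketch of that idea, using plain pickle for illustration (the diff uses CPickleSerializer) and illustrative names:

import copy
import pickle

from pyspark.sql.types import LongType, StructField, StructType

cached_schema = StructType([StructField("id", LongType())])
cached_bytes = pickle.dumps(cached_schema)   # done once, when the schema is first fetched


def schema_copy() -> StructType:
    try:
        return pickle.loads(cached_bytes)    # fresh, independent StructType per call
    except Exception:
        return copy.deepcopy(cached_schema)  # fallback path, mirroring the diff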
diff --git a/python/pyspark/sql/connect/expressions.py b/python/pyspark/sql/connect/expressions.py
index 872770ee22911..4ddf13757db41 100644
--- a/python/pyspark/sql/connect/expressions.py
+++ b/python/pyspark/sql/connect/expressions.py
@@ -54,6 +54,7 @@
DecimalType,
StringType,
DataType,
+ TimeType,
TimestampType,
TimestampNTZType,
DayTimeIntervalType,
@@ -248,6 +249,7 @@ def __init__(self, value: Any, dataType: DataType) -> None:
DecimalType,
StringType,
DateType,
+ TimeType,
TimestampType,
TimestampNTZType,
DayTimeIntervalType,
@@ -298,6 +300,9 @@ def __init__(self, value: Any, dataType: DataType) -> None:
value = DateType().toInternal(value)
else:
value = DateType().toInternal(value.date())
+ elif isinstance(dataType, TimeType):
+ assert isinstance(value, datetime.time)
+ value = TimeType().toInternal(value)
elif isinstance(dataType, TimestampType):
assert isinstance(value, datetime.datetime)
value = TimestampType().toInternal(value)
@@ -352,6 +357,8 @@ def _infer_type(cls, value: Any) -> DataType:
return TimestampNTZType() if is_timestamp_ntz_preferred() else TimestampType()
elif isinstance(value, datetime.date):
return DateType()
+ elif isinstance(value, datetime.time):
+ return TimeType()
elif isinstance(value, datetime.timedelta):
return DayTimeIntervalType()
elif isinstance(value, np.generic):
@@ -416,6 +423,9 @@ def _to_value(
elif literal.HasField("date"):
assert dataType is None or isinstance(dataType, DataType)
return DateType().fromInternal(literal.date)
+ elif literal.HasField("time"):
+ assert dataType is None or isinstance(dataType, TimeType)
+ return TimeType().fromInternal(literal.time.nano)
elif literal.HasField("timestamp"):
assert dataType is None or isinstance(dataType, TimestampType)
return TimestampType().fromInternal(literal.timestamp)
@@ -468,6 +478,9 @@ def to_plan(self, session: "SparkConnectClient") -> "proto.Expression":
expr.literal.string = str(self._value)
elif isinstance(self._dataType, DateType):
expr.literal.date = int(self._value)
+ elif isinstance(self._dataType, TimeType):
+ expr.literal.time.precision = self._dataType.precision
+ expr.literal.time.nano = int(self._value)
elif isinstance(self._dataType, TimestampType):
expr.literal.timestamp = int(self._value)
elif isinstance(self._dataType, TimestampNTZType):
@@ -496,6 +509,10 @@ def __repr__(self) -> str:
dt = DateType().fromInternal(self._value)
if dt is not None and isinstance(dt, datetime.date):
return dt.strftime("%Y-%m-%d")
+ elif isinstance(self._dataType, TimeType):
+ t = TimeType().fromInternal(self._value)
+ if t is not None and isinstance(t, datetime.time):
+ return t.strftime("%H:%M:%S.%f")
elif isinstance(self._dataType, TimestampType):
ts = TimestampType().fromInternal(self._value)
if ts is not None and isinstance(ts, datetime.datetime):
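With the TimeType handling added above, a datetime.time value can now be carried as a literal: it is inferred as TimeType, stored through toInternal, and round-tripped on the proto side via the time.nano field. A small sketch of the round trip, assuming toInternal/fromInternal are inverses at microsecond precision as the hunks suggest:

import datetime

from pyspark.sql.types import TimeType

t = datetime.time(12, 34, 56, 789000)
internal = TimeType().toInternal(t)          # integer form stored in the literal (time.nano above)
assert TimeType().fromInternal(internal) == t

# Building a literal from it, e.g. lit(datetime.time(12, 34, 56)), would now
# infer TimeType per the _infer_type branch added above.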
diff --git a/python/pyspark/sql/connect/functions/__init__.py b/python/pyspark/sql/connect/functions/__init__.py
index 087a51e8616b9..4f3657b643a87 100644
--- a/python/pyspark/sql/connect/functions/__init__.py
+++ b/python/pyspark/sql/connect/functions/__init__.py
@@ -16,7 +16,7 @@
#
"""PySpark Functions with Spark Connect"""
-from pyspark.testing import should_test_connect
+from pyspark.testing.utils import should_test_connect
if should_test_connect:
from pyspark.sql.connect.functions.builtin import * # noqa: F401,F403
diff --git a/python/pyspark/sql/connect/functions/builtin.py b/python/pyspark/sql/connect/functions/builtin.py
index 85d78ccac3015..0380b517e6e5e 100644
--- a/python/pyspark/sql/connect/functions/builtin.py
+++ b/python/pyspark/sql/connect/functions/builtin.py
@@ -60,7 +60,7 @@
)
from pyspark.sql.connect.udf import _create_py_udf
from pyspark.sql.connect.udtf import AnalyzeArgument, AnalyzeResult # noqa: F401
-from pyspark.sql.connect.udtf import _create_py_udtf
+from pyspark.sql.connect.udtf import _create_py_udtf, _create_pyarrow_udtf
from pyspark.sql import functions as pysparkfuncs
from pyspark.sql.types import (
_from_numpy_type,
@@ -73,7 +73,7 @@
# The implementation of pandas_udf is embedded in pyspark.sql.function.pandas_udf
# for code reuse.
-from pyspark.sql.functions import pandas_udf # noqa: F401
+from pyspark.sql.functions import arrow_udf, pandas_udf # noqa: F401
if TYPE_CHECKING:
@@ -3140,6 +3140,26 @@ def current_date() -> Column:
current_date.__doc__ = pysparkfuncs.current_date.__doc__
+@overload
+def current_time() -> Column:
+ ...
+
+
+@overload
+def current_time(precision: int) -> Column:
+ ...
+
+
+def current_time(precision: Optional[int] = None) -> Column:
+ if precision is None:
+ return _invoke_function("current_time")
+ else:
+ return _invoke_function("current_time", lit(precision))
+
+
+current_time.__doc__ = pysparkfuncs.current_time.__doc__
+
+
def current_timestamp() -> Column:
return _invoke_function("current_timestamp")
@@ -3375,6 +3395,16 @@ def to_date(col: "ColumnOrName", format: Optional[str] = None) -> Column:
to_date.__doc__ = pysparkfuncs.to_date.__doc__
+def try_to_date(col: "ColumnOrName", format: Optional[str] = None) -> Column:
+ if format is None:
+ return _invoke_function_over_columns("try_to_date", col)
+ else:
+ return _invoke_function("try_to_date", _to_col(col), lit(format))
+
+
+try_to_date.__doc__ = pysparkfuncs.try_to_date.__doc__
+
+
def unix_date(col: "ColumnOrName") -> Column:
return _invoke_function_over_columns("unix_date", col)
@@ -3403,6 +3433,26 @@ def unix_seconds(col: "ColumnOrName") -> Column:
unix_seconds.__doc__ = pysparkfuncs.unix_seconds.__doc__
+@overload
+def to_time(str: "ColumnOrName") -> Column:
+ ...
+
+
+@overload
+def to_time(str: "ColumnOrName", format: "ColumnOrName") -> Column:
+ ...
+
+
+def to_time(str: "ColumnOrName", format: Optional["ColumnOrName"] = None) -> Column:
+ if format is None:
+ return _invoke_function_over_columns("to_time", str)
+ else:
+ return _invoke_function_over_columns("to_time", str, format)
+
+
+to_time.__doc__ = pysparkfuncs.to_time.__doc__
+
+
@overload
def to_timestamp(col: "ColumnOrName") -> Column:
...
@@ -3423,6 +3473,26 @@ def to_timestamp(col: "ColumnOrName", format: Optional[str] = None) -> Column:
to_timestamp.__doc__ = pysparkfuncs.to_timestamp.__doc__
+@overload
+def try_to_time(str: "ColumnOrName") -> Column:
+ ...
+
+
+@overload
+def try_to_time(str: "ColumnOrName", format: "ColumnOrName") -> Column:
+ ...
+
+
+def try_to_time(str: "ColumnOrName", format: Optional["ColumnOrName"] = None) -> Column:
+ if format is None:
+ return _invoke_function_over_columns("try_to_time", str)
+ else:
+ return _invoke_function_over_columns("try_to_time", str, format)
+
+
+try_to_time.__doc__ = pysparkfuncs.try_to_time.__doc__
+
+
def try_to_timestamp(col: "ColumnOrName", format: Optional["ColumnOrName"] = None) -> Column:
if format is not None:
return _invoke_function_over_columns("try_to_timestamp", col, format)
@@ -3573,6 +3643,13 @@ def timestamp_seconds(col: "ColumnOrName") -> Column:
timestamp_seconds.__doc__ = pysparkfuncs.timestamp_seconds.__doc__
+def time_trunc(unit: "ColumnOrName", time: "ColumnOrName") -> Column:
+ return _invoke_function_over_columns("time_trunc", unit, time)
+
+
+time_trunc.__doc__ = pysparkfuncs.time_trunc.__doc__
+
+
def timestamp_millis(col: "ColumnOrName") -> Column:
return _invoke_function_over_columns("timestamp_millis", col)
@@ -3847,6 +3924,13 @@ def make_interval(
make_interval.__doc__ = pysparkfuncs.make_interval.__doc__
+def make_time(hour: "ColumnOrName", minute: "ColumnOrName", second: "ColumnOrName") -> Column:
+ return _invoke_function_over_columns("make_time", hour, minute, second)
+
+
+make_time.__doc__ = pysparkfuncs.make_time.__doc__
+
+
def make_timestamp(
years: "ColumnOrName",
months: "ColumnOrName",
@@ -4416,6 +4500,20 @@ def udtf(
udtf.__doc__ = pysparkfuncs.udtf.__doc__
+def arrow_udtf(
+ cls: Optional[Type] = None,
+ *,
+ returnType: Optional[Union[StructType, str]] = None,
+) -> Union["UserDefinedTableFunction", Callable[[Type], "UserDefinedTableFunction"]]:
+ if cls is None:
+ return functools.partial(_create_pyarrow_udtf, returnType=returnType)
+ else:
+ return _create_pyarrow_udtf(cls=cls, returnType=returnType)
+
+
+arrow_udtf.__doc__ = pysparkfuncs.arrow_udtf.__doc__
+
+
def call_function(funcName: str, *cols: "ColumnOrName") -> Column:
from pyspark.sql.connect.column import Column as ConnectColumn
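The hunks above wire several new time-related functions and the arrow_udtf decorator into the Connect function surface. A hypothetical usage sketch, assuming an active Spark Connect session named spark; the column names, the "HH:mm:ss" format string, and the "HOUR" truncation unit are illustrative assumptions, not values taken from this diff:

from pyspark.sql.connect import functions as F

df = spark.createDataFrame([("12:34:56",)], ["t"])
result = df.select(
    F.current_time(3).alias("now"),                    # precision argument per the overload above
    F.to_time(F.col("t")).alias("time_col"),           # parse a string into a TIME value
    F.try_to_time(F.col("t"), F.lit("HH:mm:ss")).alias("time_or_null"),
    F.make_time(F.lit(1), F.lit(2), F.lit(3)).alias("made"),
    F.time_trunc(F.lit("HOUR"), F.to_time(F.col("t"))).alias("truncated"),
)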
diff --git a/python/pyspark/sql/connect/proto/expressions_pb2.py b/python/pyspark/sql/connect/proto/expressions_pb2.py
index 0cec23f4857df..3ce27567f1e04 100644
--- a/python/pyspark/sql/connect/proto/expressions_pb2.py
+++ b/python/pyspark/sql/connect/proto/expressions_pb2.py
@@ -40,7 +40,7 @@
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(
- b'\n\x1fspark/connect/expressions.proto\x12\rspark.connect\x1a\x19google/protobuf/any.proto\x1a\x19spark/connect/types.proto\x1a\x1aspark/connect/common.proto"\xf3\x34\n\nExpression\x12\x37\n\x06\x63ommon\x18\x12 \x01(\x0b\x32\x1f.spark.connect.ExpressionCommonR\x06\x63ommon\x12=\n\x07literal\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralH\x00R\x07literal\x12\x62\n\x14unresolved_attribute\x18\x02 \x01(\x0b\x32-.spark.connect.Expression.UnresolvedAttributeH\x00R\x13unresolvedAttribute\x12_\n\x13unresolved_function\x18\x03 \x01(\x0b\x32,.spark.connect.Expression.UnresolvedFunctionH\x00R\x12unresolvedFunction\x12Y\n\x11\x65xpression_string\x18\x04 \x01(\x0b\x32*.spark.connect.Expression.ExpressionStringH\x00R\x10\x65xpressionString\x12S\n\x0funresolved_star\x18\x05 \x01(\x0b\x32(.spark.connect.Expression.UnresolvedStarH\x00R\x0eunresolvedStar\x12\x37\n\x05\x61lias\x18\x06 \x01(\x0b\x32\x1f.spark.connect.Expression.AliasH\x00R\x05\x61lias\x12\x34\n\x04\x63\x61st\x18\x07 \x01(\x0b\x32\x1e.spark.connect.Expression.CastH\x00R\x04\x63\x61st\x12V\n\x10unresolved_regex\x18\x08 \x01(\x0b\x32).spark.connect.Expression.UnresolvedRegexH\x00R\x0funresolvedRegex\x12\x44\n\nsort_order\x18\t \x01(\x0b\x32#.spark.connect.Expression.SortOrderH\x00R\tsortOrder\x12S\n\x0flambda_function\x18\n \x01(\x0b\x32(.spark.connect.Expression.LambdaFunctionH\x00R\x0elambdaFunction\x12:\n\x06window\x18\x0b \x01(\x0b\x32 .spark.connect.Expression.WindowH\x00R\x06window\x12l\n\x18unresolved_extract_value\x18\x0c \x01(\x0b\x32\x30.spark.connect.Expression.UnresolvedExtractValueH\x00R\x16unresolvedExtractValue\x12M\n\rupdate_fields\x18\r \x01(\x0b\x32&.spark.connect.Expression.UpdateFieldsH\x00R\x0cupdateFields\x12\x82\x01\n unresolved_named_lambda_variable\x18\x0e \x01(\x0b\x32\x37.spark.connect.Expression.UnresolvedNamedLambdaVariableH\x00R\x1dunresolvedNamedLambdaVariable\x12~\n#common_inline_user_defined_function\x18\x0f \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionH\x00R\x1f\x63ommonInlineUserDefinedFunction\x12\x42\n\rcall_function\x18\x10 \x01(\x0b\x32\x1b.spark.connect.CallFunctionH\x00R\x0c\x63\x61llFunction\x12\x64\n\x19named_argument_expression\x18\x11 \x01(\x0b\x32&.spark.connect.NamedArgumentExpressionH\x00R\x17namedArgumentExpression\x12?\n\x0cmerge_action\x18\x13 \x01(\x0b\x32\x1a.spark.connect.MergeActionH\x00R\x0bmergeAction\x12g\n\x1atyped_aggregate_expression\x18\x14 \x01(\x0b\x32\'.spark.connect.TypedAggregateExpressionH\x00R\x18typedAggregateExpression\x12T\n\x13subquery_expression\x18\x15 \x01(\x0b\x32!.spark.connect.SubqueryExpressionH\x00R\x12subqueryExpression\x12\x35\n\textension\x18\xe7\x07 \x01(\x0b\x32\x14.google.protobuf.AnyH\x00R\textension\x1a\x8f\x06\n\x06Window\x12\x42\n\x0fwindow_function\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x0ewindowFunction\x12@\n\x0epartition_spec\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\rpartitionSpec\x12\x42\n\norder_spec\x18\x03 \x03(\x0b\x32#.spark.connect.Expression.SortOrderR\torderSpec\x12K\n\nframe_spec\x18\x04 \x01(\x0b\x32,.spark.connect.Expression.Window.WindowFrameR\tframeSpec\x1a\xed\x03\n\x0bWindowFrame\x12U\n\nframe_type\x18\x01 \x01(\x0e\x32\x36.spark.connect.Expression.Window.WindowFrame.FrameTypeR\tframeType\x12P\n\x05lower\x18\x02 \x01(\x0b\x32:.spark.connect.Expression.Window.WindowFrame.FrameBoundaryR\x05lower\x12P\n\x05upper\x18\x03 \x01(\x0b\x32:.spark.connect.Expression.Window.WindowFrame.FrameBoundaryR\x05upper\x1a\x91\x01\n\rFrameBoundary\x12!\n\x0b\x63urrent_row\x18\x01 
\x01(\x08H\x00R\ncurrentRow\x12\x1e\n\tunbounded\x18\x02 \x01(\x08H\x00R\tunbounded\x12\x31\n\x05value\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionH\x00R\x05valueB\n\n\x08\x62oundary"O\n\tFrameType\x12\x18\n\x14\x46RAME_TYPE_UNDEFINED\x10\x00\x12\x12\n\x0e\x46RAME_TYPE_ROW\x10\x01\x12\x14\n\x10\x46RAME_TYPE_RANGE\x10\x02\x1a\xa9\x03\n\tSortOrder\x12/\n\x05\x63hild\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05\x63hild\x12O\n\tdirection\x18\x02 \x01(\x0e\x32\x31.spark.connect.Expression.SortOrder.SortDirectionR\tdirection\x12U\n\rnull_ordering\x18\x03 \x01(\x0e\x32\x30.spark.connect.Expression.SortOrder.NullOrderingR\x0cnullOrdering"l\n\rSortDirection\x12\x1e\n\x1aSORT_DIRECTION_UNSPECIFIED\x10\x00\x12\x1c\n\x18SORT_DIRECTION_ASCENDING\x10\x01\x12\x1d\n\x19SORT_DIRECTION_DESCENDING\x10\x02"U\n\x0cNullOrdering\x12\x1a\n\x16SORT_NULLS_UNSPECIFIED\x10\x00\x12\x14\n\x10SORT_NULLS_FIRST\x10\x01\x12\x13\n\x0fSORT_NULLS_LAST\x10\x02\x1a\xbb\x02\n\x04\x43\x61st\x12-\n\x04\x65xpr\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x04\x65xpr\x12-\n\x04type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\x04type\x12\x1b\n\x08type_str\x18\x03 \x01(\tH\x00R\x07typeStr\x12\x44\n\teval_mode\x18\x04 \x01(\x0e\x32\'.spark.connect.Expression.Cast.EvalModeR\x08\x65valMode"b\n\x08\x45valMode\x12\x19\n\x15\x45VAL_MODE_UNSPECIFIED\x10\x00\x12\x14\n\x10\x45VAL_MODE_LEGACY\x10\x01\x12\x12\n\x0e\x45VAL_MODE_ANSI\x10\x02\x12\x11\n\rEVAL_MODE_TRY\x10\x03\x42\x0e\n\x0c\x63\x61st_to_type\x1a\xc1\x0f\n\x07Literal\x12-\n\x04null\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\x04null\x12\x18\n\x06\x62inary\x18\x02 \x01(\x0cH\x00R\x06\x62inary\x12\x1a\n\x07\x62oolean\x18\x03 \x01(\x08H\x00R\x07\x62oolean\x12\x14\n\x04\x62yte\x18\x04 \x01(\x05H\x00R\x04\x62yte\x12\x16\n\x05short\x18\x05 \x01(\x05H\x00R\x05short\x12\x1a\n\x07integer\x18\x06 \x01(\x05H\x00R\x07integer\x12\x14\n\x04long\x18\x07 \x01(\x03H\x00R\x04long\x12\x16\n\x05\x66loat\x18\n \x01(\x02H\x00R\x05\x66loat\x12\x18\n\x06\x64ouble\x18\x0b \x01(\x01H\x00R\x06\x64ouble\x12\x45\n\x07\x64\x65\x63imal\x18\x0c \x01(\x0b\x32).spark.connect.Expression.Literal.DecimalH\x00R\x07\x64\x65\x63imal\x12\x18\n\x06string\x18\r \x01(\tH\x00R\x06string\x12\x14\n\x04\x64\x61te\x18\x10 \x01(\x05H\x00R\x04\x64\x61te\x12\x1e\n\ttimestamp\x18\x11 \x01(\x03H\x00R\ttimestamp\x12%\n\rtimestamp_ntz\x18\x12 \x01(\x03H\x00R\x0ctimestampNtz\x12\x61\n\x11\x63\x61lendar_interval\x18\x13 \x01(\x0b\x32\x32.spark.connect.Expression.Literal.CalendarIntervalH\x00R\x10\x63\x61lendarInterval\x12\x30\n\x13year_month_interval\x18\x14 \x01(\x05H\x00R\x11yearMonthInterval\x12,\n\x11\x64\x61y_time_interval\x18\x15 \x01(\x03H\x00R\x0f\x64\x61yTimeInterval\x12?\n\x05\x61rray\x18\x16 \x01(\x0b\x32\'.spark.connect.Expression.Literal.ArrayH\x00R\x05\x61rray\x12\x39\n\x03map\x18\x17 \x01(\x0b\x32%.spark.connect.Expression.Literal.MapH\x00R\x03map\x12\x42\n\x06struct\x18\x18 \x01(\x0b\x32(.spark.connect.Expression.Literal.StructH\x00R\x06struct\x12\x61\n\x11specialized_array\x18\x19 \x01(\x0b\x32\x32.spark.connect.Expression.Literal.SpecializedArrayH\x00R\x10specializedArray\x1au\n\x07\x44\x65\x63imal\x12\x14\n\x05value\x18\x01 \x01(\tR\x05value\x12!\n\tprecision\x18\x02 \x01(\x05H\x00R\tprecision\x88\x01\x01\x12\x19\n\x05scale\x18\x03 \x01(\x05H\x01R\x05scale\x88\x01\x01\x42\x0c\n\n_precisionB\x08\n\x06_scale\x1a\x62\n\x10\x43\x61lendarInterval\x12\x16\n\x06months\x18\x01 \x01(\x05R\x06months\x12\x12\n\x04\x64\x61ys\x18\x02 \x01(\x05R\x04\x64\x61ys\x12"\n\x0cmicroseconds\x18\x03 
\x01(\x03R\x0cmicroseconds\x1a\x82\x01\n\x05\x41rray\x12:\n\x0c\x65lement_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x0b\x65lementType\x12=\n\x08\x65lements\x18\x02 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x08\x65lements\x1a\xe3\x01\n\x03Map\x12\x32\n\x08key_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x07keyType\x12\x36\n\nvalue_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\tvalueType\x12\x35\n\x04keys\x18\x03 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x04keys\x12\x39\n\x06values\x18\x04 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x06values\x1a\x81\x01\n\x06Struct\x12\x38\n\x0bstruct_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\nstructType\x12=\n\x08\x65lements\x18\x02 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x08\x65lements\x1a\xc0\x02\n\x10SpecializedArray\x12,\n\x05\x62ools\x18\x01 \x01(\x0b\x32\x14.spark.connect.BoolsH\x00R\x05\x62ools\x12)\n\x04ints\x18\x02 \x01(\x0b\x32\x13.spark.connect.IntsH\x00R\x04ints\x12,\n\x05longs\x18\x03 \x01(\x0b\x32\x14.spark.connect.LongsH\x00R\x05longs\x12/\n\x06\x66loats\x18\x04 \x01(\x0b\x32\x15.spark.connect.FloatsH\x00R\x06\x66loats\x12\x32\n\x07\x64oubles\x18\x05 \x01(\x0b\x32\x16.spark.connect.DoublesH\x00R\x07\x64oubles\x12\x32\n\x07strings\x18\x06 \x01(\x0b\x32\x16.spark.connect.StringsH\x00R\x07stringsB\x0c\n\nvalue_typeB\x0e\n\x0cliteral_type\x1a\xba\x01\n\x13UnresolvedAttribute\x12/\n\x13unparsed_identifier\x18\x01 \x01(\tR\x12unparsedIdentifier\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x00R\x06planId\x88\x01\x01\x12\x31\n\x12is_metadata_column\x18\x03 \x01(\x08H\x01R\x10isMetadataColumn\x88\x01\x01\x42\n\n\x08_plan_idB\x15\n\x13_is_metadata_column\x1a\x82\x02\n\x12UnresolvedFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12\x37\n\targuments\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments\x12\x1f\n\x0bis_distinct\x18\x03 \x01(\x08R\nisDistinct\x12\x37\n\x18is_user_defined_function\x18\x04 \x01(\x08R\x15isUserDefinedFunction\x12$\n\x0bis_internal\x18\x05 \x01(\x08H\x00R\nisInternal\x88\x01\x01\x42\x0e\n\x0c_is_internal\x1a\x32\n\x10\x45xpressionString\x12\x1e\n\nexpression\x18\x01 \x01(\tR\nexpression\x1a|\n\x0eUnresolvedStar\x12,\n\x0funparsed_target\x18\x01 \x01(\tH\x00R\x0eunparsedTarget\x88\x01\x01\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x01R\x06planId\x88\x01\x01\x42\x12\n\x10_unparsed_targetB\n\n\x08_plan_id\x1aV\n\x0fUnresolvedRegex\x12\x19\n\x08\x63ol_name\x18\x01 \x01(\tR\x07\x63olName\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x00R\x06planId\x88\x01\x01\x42\n\n\x08_plan_id\x1a\x84\x01\n\x16UnresolvedExtractValue\x12/\n\x05\x63hild\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05\x63hild\x12\x39\n\nextraction\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\nextraction\x1a\xbb\x01\n\x0cUpdateFields\x12\x46\n\x11struct_expression\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x10structExpression\x12\x1d\n\nfield_name\x18\x02 \x01(\tR\tfieldName\x12\x44\n\x10value_expression\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x0fvalueExpression\x1ax\n\x05\x41lias\x12-\n\x04\x65xpr\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x04\x65xpr\x12\x12\n\x04name\x18\x02 \x03(\tR\x04name\x12\x1f\n\x08metadata\x18\x03 \x01(\tH\x00R\x08metadata\x88\x01\x01\x42\x0b\n\t_metadata\x1a\x9e\x01\n\x0eLambdaFunction\x12\x35\n\x08\x66unction\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x08\x66unction\x12U\n\targuments\x18\x02 
\x03(\x0b\x32\x37.spark.connect.Expression.UnresolvedNamedLambdaVariableR\targuments\x1a>\n\x1dUnresolvedNamedLambdaVariable\x12\x1d\n\nname_parts\x18\x01 \x03(\tR\tnamePartsB\x0b\n\texpr_type"A\n\x10\x45xpressionCommon\x12-\n\x06origin\x18\x01 \x01(\x0b\x32\x15.spark.connect.OriginR\x06origin"\x8d\x03\n\x1f\x43ommonInlineUserDefinedFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12$\n\rdeterministic\x18\x02 \x01(\x08R\rdeterministic\x12\x37\n\targuments\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments\x12\x39\n\npython_udf\x18\x04 \x01(\x0b\x32\x18.spark.connect.PythonUDFH\x00R\tpythonUdf\x12I\n\x10scalar_scala_udf\x18\x05 \x01(\x0b\x32\x1d.spark.connect.ScalarScalaUDFH\x00R\x0escalarScalaUdf\x12\x33\n\x08java_udf\x18\x06 \x01(\x0b\x32\x16.spark.connect.JavaUDFH\x00R\x07javaUdf\x12\x1f\n\x0bis_distinct\x18\x07 \x01(\x08R\nisDistinctB\n\n\x08\x66unction"\xcc\x01\n\tPythonUDF\x12\x38\n\x0boutput_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\noutputType\x12\x1b\n\teval_type\x18\x02 \x01(\x05R\x08\x65valType\x12\x18\n\x07\x63ommand\x18\x03 \x01(\x0cR\x07\x63ommand\x12\x1d\n\npython_ver\x18\x04 \x01(\tR\tpythonVer\x12/\n\x13\x61\x64\x64itional_includes\x18\x05 \x03(\tR\x12\x61\x64\x64itionalIncludes"\xd6\x01\n\x0eScalarScalaUDF\x12\x18\n\x07payload\x18\x01 \x01(\x0cR\x07payload\x12\x37\n\ninputTypes\x18\x02 \x03(\x0b\x32\x17.spark.connect.DataTypeR\ninputTypes\x12\x37\n\noutputType\x18\x03 \x01(\x0b\x32\x17.spark.connect.DataTypeR\noutputType\x12\x1a\n\x08nullable\x18\x04 \x01(\x08R\x08nullable\x12\x1c\n\taggregate\x18\x05 \x01(\x08R\taggregate"\x95\x01\n\x07JavaUDF\x12\x1d\n\nclass_name\x18\x01 \x01(\tR\tclassName\x12=\n\x0boutput_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\noutputType\x88\x01\x01\x12\x1c\n\taggregate\x18\x03 \x01(\x08R\taggregateB\x0e\n\x0c_output_type"c\n\x18TypedAggregateExpression\x12G\n\x10scalar_scala_udf\x18\x01 \x01(\x0b\x32\x1d.spark.connect.ScalarScalaUDFR\x0escalarScalaUdf"l\n\x0c\x43\x61llFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12\x37\n\targuments\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments"\\\n\x17NamedArgumentExpression\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12/\n\x05value\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05value"\x80\x04\n\x0bMergeAction\x12\x46\n\x0b\x61\x63tion_type\x18\x01 \x01(\x0e\x32%.spark.connect.MergeAction.ActionTypeR\nactionType\x12<\n\tcondition\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionH\x00R\tcondition\x88\x01\x01\x12G\n\x0b\x61ssignments\x18\x03 \x03(\x0b\x32%.spark.connect.MergeAction.AssignmentR\x0b\x61ssignments\x1aj\n\nAssignment\x12+\n\x03key\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x03key\x12/\n\x05value\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05value"\xa7\x01\n\nActionType\x12\x17\n\x13\x41\x43TION_TYPE_INVALID\x10\x00\x12\x16\n\x12\x41\x43TION_TYPE_DELETE\x10\x01\x12\x16\n\x12\x41\x43TION_TYPE_INSERT\x10\x02\x12\x1b\n\x17\x41\x43TION_TYPE_INSERT_STAR\x10\x03\x12\x16\n\x12\x41\x43TION_TYPE_UPDATE\x10\x04\x12\x1b\n\x17\x41\x43TION_TYPE_UPDATE_STAR\x10\x05\x42\x0c\n\n_condition"\xc5\x05\n\x12SubqueryExpression\x12\x17\n\x07plan_id\x18\x01 \x01(\x03R\x06planId\x12S\n\rsubquery_type\x18\x02 \x01(\x0e\x32..spark.connect.SubqueryExpression.SubqueryTypeR\x0csubqueryType\x12\x62\n\x11table_arg_options\x18\x03 \x01(\x0b\x32\x31.spark.connect.SubqueryExpression.TableArgOptionsH\x00R\x0ftableArgOptions\x88\x01\x01\x12G\n\x12in_subquery_values\x18\x04 
\x03(\x0b\x32\x19.spark.connect.ExpressionR\x10inSubqueryValues\x1a\xea\x01\n\x0fTableArgOptions\x12@\n\x0epartition_spec\x18\x01 \x03(\x0b\x32\x19.spark.connect.ExpressionR\rpartitionSpec\x12\x42\n\norder_spec\x18\x02 \x03(\x0b\x32#.spark.connect.Expression.SortOrderR\torderSpec\x12\x37\n\x15with_single_partition\x18\x03 \x01(\x08H\x00R\x13withSinglePartition\x88\x01\x01\x42\x18\n\x16_with_single_partition"\x90\x01\n\x0cSubqueryType\x12\x19\n\x15SUBQUERY_TYPE_UNKNOWN\x10\x00\x12\x18\n\x14SUBQUERY_TYPE_SCALAR\x10\x01\x12\x18\n\x14SUBQUERY_TYPE_EXISTS\x10\x02\x12\x1b\n\x17SUBQUERY_TYPE_TABLE_ARG\x10\x03\x12\x14\n\x10SUBQUERY_TYPE_IN\x10\x04\x42\x14\n\x12_table_arg_optionsB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
+ b'\n\x1fspark/connect/expressions.proto\x12\rspark.connect\x1a\x19google/protobuf/any.proto\x1a\x19spark/connect/types.proto\x1a\x1aspark/connect/common.proto"\xce\x37\n\nExpression\x12\x37\n\x06\x63ommon\x18\x12 \x01(\x0b\x32\x1f.spark.connect.ExpressionCommonR\x06\x63ommon\x12=\n\x07literal\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralH\x00R\x07literal\x12\x62\n\x14unresolved_attribute\x18\x02 \x01(\x0b\x32-.spark.connect.Expression.UnresolvedAttributeH\x00R\x13unresolvedAttribute\x12_\n\x13unresolved_function\x18\x03 \x01(\x0b\x32,.spark.connect.Expression.UnresolvedFunctionH\x00R\x12unresolvedFunction\x12Y\n\x11\x65xpression_string\x18\x04 \x01(\x0b\x32*.spark.connect.Expression.ExpressionStringH\x00R\x10\x65xpressionString\x12S\n\x0funresolved_star\x18\x05 \x01(\x0b\x32(.spark.connect.Expression.UnresolvedStarH\x00R\x0eunresolvedStar\x12\x37\n\x05\x61lias\x18\x06 \x01(\x0b\x32\x1f.spark.connect.Expression.AliasH\x00R\x05\x61lias\x12\x34\n\x04\x63\x61st\x18\x07 \x01(\x0b\x32\x1e.spark.connect.Expression.CastH\x00R\x04\x63\x61st\x12V\n\x10unresolved_regex\x18\x08 \x01(\x0b\x32).spark.connect.Expression.UnresolvedRegexH\x00R\x0funresolvedRegex\x12\x44\n\nsort_order\x18\t \x01(\x0b\x32#.spark.connect.Expression.SortOrderH\x00R\tsortOrder\x12S\n\x0flambda_function\x18\n \x01(\x0b\x32(.spark.connect.Expression.LambdaFunctionH\x00R\x0elambdaFunction\x12:\n\x06window\x18\x0b \x01(\x0b\x32 .spark.connect.Expression.WindowH\x00R\x06window\x12l\n\x18unresolved_extract_value\x18\x0c \x01(\x0b\x32\x30.spark.connect.Expression.UnresolvedExtractValueH\x00R\x16unresolvedExtractValue\x12M\n\rupdate_fields\x18\r \x01(\x0b\x32&.spark.connect.Expression.UpdateFieldsH\x00R\x0cupdateFields\x12\x82\x01\n unresolved_named_lambda_variable\x18\x0e \x01(\x0b\x32\x37.spark.connect.Expression.UnresolvedNamedLambdaVariableH\x00R\x1dunresolvedNamedLambdaVariable\x12~\n#common_inline_user_defined_function\x18\x0f \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionH\x00R\x1f\x63ommonInlineUserDefinedFunction\x12\x42\n\rcall_function\x18\x10 \x01(\x0b\x32\x1b.spark.connect.CallFunctionH\x00R\x0c\x63\x61llFunction\x12\x64\n\x19named_argument_expression\x18\x11 \x01(\x0b\x32&.spark.connect.NamedArgumentExpressionH\x00R\x17namedArgumentExpression\x12?\n\x0cmerge_action\x18\x13 \x01(\x0b\x32\x1a.spark.connect.MergeActionH\x00R\x0bmergeAction\x12g\n\x1atyped_aggregate_expression\x18\x14 \x01(\x0b\x32\'.spark.connect.TypedAggregateExpressionH\x00R\x18typedAggregateExpression\x12T\n\x13subquery_expression\x18\x15 \x01(\x0b\x32!.spark.connect.SubqueryExpressionH\x00R\x12subqueryExpression\x12\x35\n\textension\x18\xe7\x07 \x01(\x0b\x32\x14.google.protobuf.AnyH\x00R\textension\x1a\x8f\x06\n\x06Window\x12\x42\n\x0fwindow_function\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x0ewindowFunction\x12@\n\x0epartition_spec\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\rpartitionSpec\x12\x42\n\norder_spec\x18\x03 \x03(\x0b\x32#.spark.connect.Expression.SortOrderR\torderSpec\x12K\n\nframe_spec\x18\x04 \x01(\x0b\x32,.spark.connect.Expression.Window.WindowFrameR\tframeSpec\x1a\xed\x03\n\x0bWindowFrame\x12U\n\nframe_type\x18\x01 \x01(\x0e\x32\x36.spark.connect.Expression.Window.WindowFrame.FrameTypeR\tframeType\x12P\n\x05lower\x18\x02 \x01(\x0b\x32:.spark.connect.Expression.Window.WindowFrame.FrameBoundaryR\x05lower\x12P\n\x05upper\x18\x03 \x01(\x0b\x32:.spark.connect.Expression.Window.WindowFrame.FrameBoundaryR\x05upper\x1a\x91\x01\n\rFrameBoundary\x12!\n\x0b\x63urrent_row\x18\x01 
\x01(\x08H\x00R\ncurrentRow\x12\x1e\n\tunbounded\x18\x02 \x01(\x08H\x00R\tunbounded\x12\x31\n\x05value\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionH\x00R\x05valueB\n\n\x08\x62oundary"O\n\tFrameType\x12\x18\n\x14\x46RAME_TYPE_UNDEFINED\x10\x00\x12\x12\n\x0e\x46RAME_TYPE_ROW\x10\x01\x12\x14\n\x10\x46RAME_TYPE_RANGE\x10\x02\x1a\xa9\x03\n\tSortOrder\x12/\n\x05\x63hild\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05\x63hild\x12O\n\tdirection\x18\x02 \x01(\x0e\x32\x31.spark.connect.Expression.SortOrder.SortDirectionR\tdirection\x12U\n\rnull_ordering\x18\x03 \x01(\x0e\x32\x30.spark.connect.Expression.SortOrder.NullOrderingR\x0cnullOrdering"l\n\rSortDirection\x12\x1e\n\x1aSORT_DIRECTION_UNSPECIFIED\x10\x00\x12\x1c\n\x18SORT_DIRECTION_ASCENDING\x10\x01\x12\x1d\n\x19SORT_DIRECTION_DESCENDING\x10\x02"U\n\x0cNullOrdering\x12\x1a\n\x16SORT_NULLS_UNSPECIFIED\x10\x00\x12\x14\n\x10SORT_NULLS_FIRST\x10\x01\x12\x13\n\x0fSORT_NULLS_LAST\x10\x02\x1a\xbb\x02\n\x04\x43\x61st\x12-\n\x04\x65xpr\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x04\x65xpr\x12-\n\x04type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\x04type\x12\x1b\n\x08type_str\x18\x03 \x01(\tH\x00R\x07typeStr\x12\x44\n\teval_mode\x18\x04 \x01(\x0e\x32\'.spark.connect.Expression.Cast.EvalModeR\x08\x65valMode"b\n\x08\x45valMode\x12\x19\n\x15\x45VAL_MODE_UNSPECIFIED\x10\x00\x12\x14\n\x10\x45VAL_MODE_LEGACY\x10\x01\x12\x12\n\x0e\x45VAL_MODE_ANSI\x10\x02\x12\x11\n\rEVAL_MODE_TRY\x10\x03\x42\x0e\n\x0c\x63\x61st_to_type\x1a\x9c\x12\n\x07Literal\x12-\n\x04null\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\x04null\x12\x18\n\x06\x62inary\x18\x02 \x01(\x0cH\x00R\x06\x62inary\x12\x1a\n\x07\x62oolean\x18\x03 \x01(\x08H\x00R\x07\x62oolean\x12\x14\n\x04\x62yte\x18\x04 \x01(\x05H\x00R\x04\x62yte\x12\x16\n\x05short\x18\x05 \x01(\x05H\x00R\x05short\x12\x1a\n\x07integer\x18\x06 \x01(\x05H\x00R\x07integer\x12\x14\n\x04long\x18\x07 \x01(\x03H\x00R\x04long\x12\x16\n\x05\x66loat\x18\n \x01(\x02H\x00R\x05\x66loat\x12\x18\n\x06\x64ouble\x18\x0b \x01(\x01H\x00R\x06\x64ouble\x12\x45\n\x07\x64\x65\x63imal\x18\x0c \x01(\x0b\x32).spark.connect.Expression.Literal.DecimalH\x00R\x07\x64\x65\x63imal\x12\x18\n\x06string\x18\r \x01(\tH\x00R\x06string\x12\x14\n\x04\x64\x61te\x18\x10 \x01(\x05H\x00R\x04\x64\x61te\x12\x1e\n\ttimestamp\x18\x11 \x01(\x03H\x00R\ttimestamp\x12%\n\rtimestamp_ntz\x18\x12 \x01(\x03H\x00R\x0ctimestampNtz\x12\x61\n\x11\x63\x61lendar_interval\x18\x13 \x01(\x0b\x32\x32.spark.connect.Expression.Literal.CalendarIntervalH\x00R\x10\x63\x61lendarInterval\x12\x30\n\x13year_month_interval\x18\x14 \x01(\x05H\x00R\x11yearMonthInterval\x12,\n\x11\x64\x61y_time_interval\x18\x15 \x01(\x03H\x00R\x0f\x64\x61yTimeInterval\x12?\n\x05\x61rray\x18\x16 \x01(\x0b\x32\'.spark.connect.Expression.Literal.ArrayH\x00R\x05\x61rray\x12\x39\n\x03map\x18\x17 \x01(\x0b\x32%.spark.connect.Expression.Literal.MapH\x00R\x03map\x12\x42\n\x06struct\x18\x18 \x01(\x0b\x32(.spark.connect.Expression.Literal.StructH\x00R\x06struct\x12\x61\n\x11specialized_array\x18\x19 \x01(\x0b\x32\x32.spark.connect.Expression.Literal.SpecializedArrayH\x00R\x10specializedArray\x12<\n\x04time\x18\x1a \x01(\x0b\x32&.spark.connect.Expression.Literal.TimeH\x00R\x04time\x1au\n\x07\x44\x65\x63imal\x12\x14\n\x05value\x18\x01 \x01(\tR\x05value\x12!\n\tprecision\x18\x02 \x01(\x05H\x00R\tprecision\x88\x01\x01\x12\x19\n\x05scale\x18\x03 \x01(\x05H\x01R\x05scale\x88\x01\x01\x42\x0c\n\n_precisionB\x08\n\x06_scale\x1a\x62\n\x10\x43\x61lendarInterval\x12\x16\n\x06months\x18\x01 
\x01(\x05R\x06months\x12\x12\n\x04\x64\x61ys\x18\x02 \x01(\x05R\x04\x64\x61ys\x12"\n\x0cmicroseconds\x18\x03 \x01(\x03R\x0cmicroseconds\x1a\xc2\x01\n\x05\x41rray\x12>\n\x0c\x65lement_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeB\x02\x18\x01R\x0b\x65lementType\x12=\n\x08\x65lements\x18\x02 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x08\x65lements\x12:\n\tdata_type\x18\x03 \x01(\x0b\x32\x1d.spark.connect.DataType.ArrayR\x08\x64\x61taType\x1a\xa5\x02\n\x03Map\x12\x36\n\x08key_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeB\x02\x18\x01R\x07keyType\x12:\n\nvalue_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeB\x02\x18\x01R\tvalueType\x12\x35\n\x04keys\x18\x03 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x04keys\x12\x39\n\x06values\x18\x04 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x06values\x12\x38\n\tdata_type\x18\x05 \x01(\x0b\x32\x1b.spark.connect.DataType.MapR\x08\x64\x61taType\x1a\xcf\x01\n\x06Struct\x12<\n\x0bstruct_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeB\x02\x18\x01R\nstructType\x12=\n\x08\x65lements\x18\x02 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x08\x65lements\x12H\n\x10\x64\x61ta_type_struct\x18\x03 \x01(\x0b\x32\x1e.spark.connect.DataType.StructR\x0e\x64\x61taTypeStruct\x1a\xc0\x02\n\x10SpecializedArray\x12,\n\x05\x62ools\x18\x01 \x01(\x0b\x32\x14.spark.connect.BoolsH\x00R\x05\x62ools\x12)\n\x04ints\x18\x02 \x01(\x0b\x32\x13.spark.connect.IntsH\x00R\x04ints\x12,\n\x05longs\x18\x03 \x01(\x0b\x32\x14.spark.connect.LongsH\x00R\x05longs\x12/\n\x06\x66loats\x18\x04 \x01(\x0b\x32\x15.spark.connect.FloatsH\x00R\x06\x66loats\x12\x32\n\x07\x64oubles\x18\x05 \x01(\x0b\x32\x16.spark.connect.DoublesH\x00R\x07\x64oubles\x12\x32\n\x07strings\x18\x06 \x01(\x0b\x32\x16.spark.connect.StringsH\x00R\x07stringsB\x0c\n\nvalue_type\x1aK\n\x04Time\x12\x12\n\x04nano\x18\x01 \x01(\x03R\x04nano\x12!\n\tprecision\x18\x02 \x01(\x05H\x00R\tprecision\x88\x01\x01\x42\x0c\n\n_precisionB\x0e\n\x0cliteral_type\x1a\xba\x01\n\x13UnresolvedAttribute\x12/\n\x13unparsed_identifier\x18\x01 \x01(\tR\x12unparsedIdentifier\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x00R\x06planId\x88\x01\x01\x12\x31\n\x12is_metadata_column\x18\x03 \x01(\x08H\x01R\x10isMetadataColumn\x88\x01\x01\x42\n\n\x08_plan_idB\x15\n\x13_is_metadata_column\x1a\x82\x02\n\x12UnresolvedFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12\x37\n\targuments\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments\x12\x1f\n\x0bis_distinct\x18\x03 \x01(\x08R\nisDistinct\x12\x37\n\x18is_user_defined_function\x18\x04 \x01(\x08R\x15isUserDefinedFunction\x12$\n\x0bis_internal\x18\x05 \x01(\x08H\x00R\nisInternal\x88\x01\x01\x42\x0e\n\x0c_is_internal\x1a\x32\n\x10\x45xpressionString\x12\x1e\n\nexpression\x18\x01 \x01(\tR\nexpression\x1a|\n\x0eUnresolvedStar\x12,\n\x0funparsed_target\x18\x01 \x01(\tH\x00R\x0eunparsedTarget\x88\x01\x01\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x01R\x06planId\x88\x01\x01\x42\x12\n\x10_unparsed_targetB\n\n\x08_plan_id\x1aV\n\x0fUnresolvedRegex\x12\x19\n\x08\x63ol_name\x18\x01 \x01(\tR\x07\x63olName\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x00R\x06planId\x88\x01\x01\x42\n\n\x08_plan_id\x1a\x84\x01\n\x16UnresolvedExtractValue\x12/\n\x05\x63hild\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05\x63hild\x12\x39\n\nextraction\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\nextraction\x1a\xbb\x01\n\x0cUpdateFields\x12\x46\n\x11struct_expression\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x10structExpression\x12\x1d\n\nfield_name\x18\x02 
\x01(\tR\tfieldName\x12\x44\n\x10value_expression\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x0fvalueExpression\x1ax\n\x05\x41lias\x12-\n\x04\x65xpr\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x04\x65xpr\x12\x12\n\x04name\x18\x02 \x03(\tR\x04name\x12\x1f\n\x08metadata\x18\x03 \x01(\tH\x00R\x08metadata\x88\x01\x01\x42\x0b\n\t_metadata\x1a\x9e\x01\n\x0eLambdaFunction\x12\x35\n\x08\x66unction\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x08\x66unction\x12U\n\targuments\x18\x02 \x03(\x0b\x32\x37.spark.connect.Expression.UnresolvedNamedLambdaVariableR\targuments\x1a>\n\x1dUnresolvedNamedLambdaVariable\x12\x1d\n\nname_parts\x18\x01 \x03(\tR\tnamePartsB\x0b\n\texpr_type"A\n\x10\x45xpressionCommon\x12-\n\x06origin\x18\x01 \x01(\x0b\x32\x15.spark.connect.OriginR\x06origin"\x8d\x03\n\x1f\x43ommonInlineUserDefinedFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12$\n\rdeterministic\x18\x02 \x01(\x08R\rdeterministic\x12\x37\n\targuments\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments\x12\x39\n\npython_udf\x18\x04 \x01(\x0b\x32\x18.spark.connect.PythonUDFH\x00R\tpythonUdf\x12I\n\x10scalar_scala_udf\x18\x05 \x01(\x0b\x32\x1d.spark.connect.ScalarScalaUDFH\x00R\x0escalarScalaUdf\x12\x33\n\x08java_udf\x18\x06 \x01(\x0b\x32\x16.spark.connect.JavaUDFH\x00R\x07javaUdf\x12\x1f\n\x0bis_distinct\x18\x07 \x01(\x08R\nisDistinctB\n\n\x08\x66unction"\xcc\x01\n\tPythonUDF\x12\x38\n\x0boutput_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\noutputType\x12\x1b\n\teval_type\x18\x02 \x01(\x05R\x08\x65valType\x12\x18\n\x07\x63ommand\x18\x03 \x01(\x0cR\x07\x63ommand\x12\x1d\n\npython_ver\x18\x04 \x01(\tR\tpythonVer\x12/\n\x13\x61\x64\x64itional_includes\x18\x05 \x03(\tR\x12\x61\x64\x64itionalIncludes"\xd6\x01\n\x0eScalarScalaUDF\x12\x18\n\x07payload\x18\x01 \x01(\x0cR\x07payload\x12\x37\n\ninputTypes\x18\x02 \x03(\x0b\x32\x17.spark.connect.DataTypeR\ninputTypes\x12\x37\n\noutputType\x18\x03 \x01(\x0b\x32\x17.spark.connect.DataTypeR\noutputType\x12\x1a\n\x08nullable\x18\x04 \x01(\x08R\x08nullable\x12\x1c\n\taggregate\x18\x05 \x01(\x08R\taggregate"\x95\x01\n\x07JavaUDF\x12\x1d\n\nclass_name\x18\x01 \x01(\tR\tclassName\x12=\n\x0boutput_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\noutputType\x88\x01\x01\x12\x1c\n\taggregate\x18\x03 \x01(\x08R\taggregateB\x0e\n\x0c_output_type"c\n\x18TypedAggregateExpression\x12G\n\x10scalar_scala_udf\x18\x01 \x01(\x0b\x32\x1d.spark.connect.ScalarScalaUDFR\x0escalarScalaUdf"l\n\x0c\x43\x61llFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12\x37\n\targuments\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments"\\\n\x17NamedArgumentExpression\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12/\n\x05value\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05value"\x80\x04\n\x0bMergeAction\x12\x46\n\x0b\x61\x63tion_type\x18\x01 \x01(\x0e\x32%.spark.connect.MergeAction.ActionTypeR\nactionType\x12<\n\tcondition\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionH\x00R\tcondition\x88\x01\x01\x12G\n\x0b\x61ssignments\x18\x03 \x03(\x0b\x32%.spark.connect.MergeAction.AssignmentR\x0b\x61ssignments\x1aj\n\nAssignment\x12+\n\x03key\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x03key\x12/\n\x05value\x18\x02 
\x01(\x0b\x32\x19.spark.connect.ExpressionR\x05value"\xa7\x01\n\nActionType\x12\x17\n\x13\x41\x43TION_TYPE_INVALID\x10\x00\x12\x16\n\x12\x41\x43TION_TYPE_DELETE\x10\x01\x12\x16\n\x12\x41\x43TION_TYPE_INSERT\x10\x02\x12\x1b\n\x17\x41\x43TION_TYPE_INSERT_STAR\x10\x03\x12\x16\n\x12\x41\x43TION_TYPE_UPDATE\x10\x04\x12\x1b\n\x17\x41\x43TION_TYPE_UPDATE_STAR\x10\x05\x42\x0c\n\n_condition"\xc5\x05\n\x12SubqueryExpression\x12\x17\n\x07plan_id\x18\x01 \x01(\x03R\x06planId\x12S\n\rsubquery_type\x18\x02 \x01(\x0e\x32..spark.connect.SubqueryExpression.SubqueryTypeR\x0csubqueryType\x12\x62\n\x11table_arg_options\x18\x03 \x01(\x0b\x32\x31.spark.connect.SubqueryExpression.TableArgOptionsH\x00R\x0ftableArgOptions\x88\x01\x01\x12G\n\x12in_subquery_values\x18\x04 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x10inSubqueryValues\x1a\xea\x01\n\x0fTableArgOptions\x12@\n\x0epartition_spec\x18\x01 \x03(\x0b\x32\x19.spark.connect.ExpressionR\rpartitionSpec\x12\x42\n\norder_spec\x18\x02 \x03(\x0b\x32#.spark.connect.Expression.SortOrderR\torderSpec\x12\x37\n\x15with_single_partition\x18\x03 \x01(\x08H\x00R\x13withSinglePartition\x88\x01\x01\x42\x18\n\x16_with_single_partition"\x90\x01\n\x0cSubqueryType\x12\x19\n\x15SUBQUERY_TYPE_UNKNOWN\x10\x00\x12\x18\n\x14SUBQUERY_TYPE_SCALAR\x10\x01\x12\x18\n\x14SUBQUERY_TYPE_EXISTS\x10\x02\x12\x1b\n\x17SUBQUERY_TYPE_TABLE_ARG\x10\x03\x12\x14\n\x10SUBQUERY_TYPE_IN\x10\x04\x42\x14\n\x12_table_arg_optionsB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
)
_globals = globals()
@@ -53,8 +53,22 @@
_globals[
"DESCRIPTOR"
]._serialized_options = b"\n\036org.apache.spark.connect.protoP\001Z\022internal/generated"
+ _globals["_EXPRESSION_LITERAL_ARRAY"].fields_by_name["element_type"]._loaded_options = None
+ _globals["_EXPRESSION_LITERAL_ARRAY"].fields_by_name[
+ "element_type"
+ ]._serialized_options = b"\030\001"
+ _globals["_EXPRESSION_LITERAL_MAP"].fields_by_name["key_type"]._loaded_options = None
+ _globals["_EXPRESSION_LITERAL_MAP"].fields_by_name["key_type"]._serialized_options = b"\030\001"
+ _globals["_EXPRESSION_LITERAL_MAP"].fields_by_name["value_type"]._loaded_options = None
+ _globals["_EXPRESSION_LITERAL_MAP"].fields_by_name[
+ "value_type"
+ ]._serialized_options = b"\030\001"
+ _globals["_EXPRESSION_LITERAL_STRUCT"].fields_by_name["struct_type"]._loaded_options = None
+ _globals["_EXPRESSION_LITERAL_STRUCT"].fields_by_name[
+ "struct_type"
+ ]._serialized_options = b"\030\001"
_globals["_EXPRESSION"]._serialized_start = 133
- _globals["_EXPRESSION"]._serialized_end = 6904
+ _globals["_EXPRESSION"]._serialized_end = 7251
_globals["_EXPRESSION_WINDOW"]._serialized_start = 1986
_globals["_EXPRESSION_WINDOW"]._serialized_end = 2769
_globals["_EXPRESSION_WINDOW_WINDOWFRAME"]._serialized_start = 2276
@@ -74,65 +88,67 @@
_globals["_EXPRESSION_CAST_EVALMODE"]._serialized_start = 3401
_globals["_EXPRESSION_CAST_EVALMODE"]._serialized_end = 3499
_globals["_EXPRESSION_LITERAL"]._serialized_start = 3518
- _globals["_EXPRESSION_LITERAL"]._serialized_end = 5503
- _globals["_EXPRESSION_LITERAL_DECIMAL"]._serialized_start = 4452
- _globals["_EXPRESSION_LITERAL_DECIMAL"]._serialized_end = 4569
- _globals["_EXPRESSION_LITERAL_CALENDARINTERVAL"]._serialized_start = 4571
- _globals["_EXPRESSION_LITERAL_CALENDARINTERVAL"]._serialized_end = 4669
- _globals["_EXPRESSION_LITERAL_ARRAY"]._serialized_start = 4672
- _globals["_EXPRESSION_LITERAL_ARRAY"]._serialized_end = 4802
- _globals["_EXPRESSION_LITERAL_MAP"]._serialized_start = 4805
- _globals["_EXPRESSION_LITERAL_MAP"]._serialized_end = 5032
- _globals["_EXPRESSION_LITERAL_STRUCT"]._serialized_start = 5035
- _globals["_EXPRESSION_LITERAL_STRUCT"]._serialized_end = 5164
- _globals["_EXPRESSION_LITERAL_SPECIALIZEDARRAY"]._serialized_start = 5167
- _globals["_EXPRESSION_LITERAL_SPECIALIZEDARRAY"]._serialized_end = 5487
- _globals["_EXPRESSION_UNRESOLVEDATTRIBUTE"]._serialized_start = 5506
- _globals["_EXPRESSION_UNRESOLVEDATTRIBUTE"]._serialized_end = 5692
- _globals["_EXPRESSION_UNRESOLVEDFUNCTION"]._serialized_start = 5695
- _globals["_EXPRESSION_UNRESOLVEDFUNCTION"]._serialized_end = 5953
- _globals["_EXPRESSION_EXPRESSIONSTRING"]._serialized_start = 5955
- _globals["_EXPRESSION_EXPRESSIONSTRING"]._serialized_end = 6005
- _globals["_EXPRESSION_UNRESOLVEDSTAR"]._serialized_start = 6007
- _globals["_EXPRESSION_UNRESOLVEDSTAR"]._serialized_end = 6131
- _globals["_EXPRESSION_UNRESOLVEDREGEX"]._serialized_start = 6133
- _globals["_EXPRESSION_UNRESOLVEDREGEX"]._serialized_end = 6219
- _globals["_EXPRESSION_UNRESOLVEDEXTRACTVALUE"]._serialized_start = 6222
- _globals["_EXPRESSION_UNRESOLVEDEXTRACTVALUE"]._serialized_end = 6354
- _globals["_EXPRESSION_UPDATEFIELDS"]._serialized_start = 6357
- _globals["_EXPRESSION_UPDATEFIELDS"]._serialized_end = 6544
- _globals["_EXPRESSION_ALIAS"]._serialized_start = 6546
- _globals["_EXPRESSION_ALIAS"]._serialized_end = 6666
- _globals["_EXPRESSION_LAMBDAFUNCTION"]._serialized_start = 6669
- _globals["_EXPRESSION_LAMBDAFUNCTION"]._serialized_end = 6827
- _globals["_EXPRESSION_UNRESOLVEDNAMEDLAMBDAVARIABLE"]._serialized_start = 6829
- _globals["_EXPRESSION_UNRESOLVEDNAMEDLAMBDAVARIABLE"]._serialized_end = 6891
- _globals["_EXPRESSIONCOMMON"]._serialized_start = 6906
- _globals["_EXPRESSIONCOMMON"]._serialized_end = 6971
- _globals["_COMMONINLINEUSERDEFINEDFUNCTION"]._serialized_start = 6974
- _globals["_COMMONINLINEUSERDEFINEDFUNCTION"]._serialized_end = 7371
- _globals["_PYTHONUDF"]._serialized_start = 7374
- _globals["_PYTHONUDF"]._serialized_end = 7578
- _globals["_SCALARSCALAUDF"]._serialized_start = 7581
- _globals["_SCALARSCALAUDF"]._serialized_end = 7795
- _globals["_JAVAUDF"]._serialized_start = 7798
- _globals["_JAVAUDF"]._serialized_end = 7947
- _globals["_TYPEDAGGREGATEEXPRESSION"]._serialized_start = 7949
- _globals["_TYPEDAGGREGATEEXPRESSION"]._serialized_end = 8048
- _globals["_CALLFUNCTION"]._serialized_start = 8050
- _globals["_CALLFUNCTION"]._serialized_end = 8158
- _globals["_NAMEDARGUMENTEXPRESSION"]._serialized_start = 8160
- _globals["_NAMEDARGUMENTEXPRESSION"]._serialized_end = 8252
- _globals["_MERGEACTION"]._serialized_start = 8255
- _globals["_MERGEACTION"]._serialized_end = 8767
- _globals["_MERGEACTION_ASSIGNMENT"]._serialized_start = 8477
- _globals["_MERGEACTION_ASSIGNMENT"]._serialized_end = 8583
- _globals["_MERGEACTION_ACTIONTYPE"]._serialized_start = 8586
- _globals["_MERGEACTION_ACTIONTYPE"]._serialized_end = 8753
- _globals["_SUBQUERYEXPRESSION"]._serialized_start = 8770
- _globals["_SUBQUERYEXPRESSION"]._serialized_end = 9479
- _globals["_SUBQUERYEXPRESSION_TABLEARGOPTIONS"]._serialized_start = 9076
- _globals["_SUBQUERYEXPRESSION_TABLEARGOPTIONS"]._serialized_end = 9310
- _globals["_SUBQUERYEXPRESSION_SUBQUERYTYPE"]._serialized_start = 9313
- _globals["_SUBQUERYEXPRESSION_SUBQUERYTYPE"]._serialized_end = 9457
+ _globals["_EXPRESSION_LITERAL"]._serialized_end = 5850
+ _globals["_EXPRESSION_LITERAL_DECIMAL"]._serialized_start = 4514
+ _globals["_EXPRESSION_LITERAL_DECIMAL"]._serialized_end = 4631
+ _globals["_EXPRESSION_LITERAL_CALENDARINTERVAL"]._serialized_start = 4633
+ _globals["_EXPRESSION_LITERAL_CALENDARINTERVAL"]._serialized_end = 4731
+ _globals["_EXPRESSION_LITERAL_ARRAY"]._serialized_start = 4734
+ _globals["_EXPRESSION_LITERAL_ARRAY"]._serialized_end = 4928
+ _globals["_EXPRESSION_LITERAL_MAP"]._serialized_start = 4931
+ _globals["_EXPRESSION_LITERAL_MAP"]._serialized_end = 5224
+ _globals["_EXPRESSION_LITERAL_STRUCT"]._serialized_start = 5227
+ _globals["_EXPRESSION_LITERAL_STRUCT"]._serialized_end = 5434
+ _globals["_EXPRESSION_LITERAL_SPECIALIZEDARRAY"]._serialized_start = 5437
+ _globals["_EXPRESSION_LITERAL_SPECIALIZEDARRAY"]._serialized_end = 5757
+ _globals["_EXPRESSION_LITERAL_TIME"]._serialized_start = 5759
+ _globals["_EXPRESSION_LITERAL_TIME"]._serialized_end = 5834
+ _globals["_EXPRESSION_UNRESOLVEDATTRIBUTE"]._serialized_start = 5853
+ _globals["_EXPRESSION_UNRESOLVEDATTRIBUTE"]._serialized_end = 6039
+ _globals["_EXPRESSION_UNRESOLVEDFUNCTION"]._serialized_start = 6042
+ _globals["_EXPRESSION_UNRESOLVEDFUNCTION"]._serialized_end = 6300
+ _globals["_EXPRESSION_EXPRESSIONSTRING"]._serialized_start = 6302
+ _globals["_EXPRESSION_EXPRESSIONSTRING"]._serialized_end = 6352
+ _globals["_EXPRESSION_UNRESOLVEDSTAR"]._serialized_start = 6354
+ _globals["_EXPRESSION_UNRESOLVEDSTAR"]._serialized_end = 6478
+ _globals["_EXPRESSION_UNRESOLVEDREGEX"]._serialized_start = 6480
+ _globals["_EXPRESSION_UNRESOLVEDREGEX"]._serialized_end = 6566
+ _globals["_EXPRESSION_UNRESOLVEDEXTRACTVALUE"]._serialized_start = 6569
+ _globals["_EXPRESSION_UNRESOLVEDEXTRACTVALUE"]._serialized_end = 6701
+ _globals["_EXPRESSION_UPDATEFIELDS"]._serialized_start = 6704
+ _globals["_EXPRESSION_UPDATEFIELDS"]._serialized_end = 6891
+ _globals["_EXPRESSION_ALIAS"]._serialized_start = 6893
+ _globals["_EXPRESSION_ALIAS"]._serialized_end = 7013
+ _globals["_EXPRESSION_LAMBDAFUNCTION"]._serialized_start = 7016
+ _globals["_EXPRESSION_LAMBDAFUNCTION"]._serialized_end = 7174
+ _globals["_EXPRESSION_UNRESOLVEDNAMEDLAMBDAVARIABLE"]._serialized_start = 7176
+ _globals["_EXPRESSION_UNRESOLVEDNAMEDLAMBDAVARIABLE"]._serialized_end = 7238
+ _globals["_EXPRESSIONCOMMON"]._serialized_start = 7253
+ _globals["_EXPRESSIONCOMMON"]._serialized_end = 7318
+ _globals["_COMMONINLINEUSERDEFINEDFUNCTION"]._serialized_start = 7321
+ _globals["_COMMONINLINEUSERDEFINEDFUNCTION"]._serialized_end = 7718
+ _globals["_PYTHONUDF"]._serialized_start = 7721
+ _globals["_PYTHONUDF"]._serialized_end = 7925
+ _globals["_SCALARSCALAUDF"]._serialized_start = 7928
+ _globals["_SCALARSCALAUDF"]._serialized_end = 8142
+ _globals["_JAVAUDF"]._serialized_start = 8145
+ _globals["_JAVAUDF"]._serialized_end = 8294
+ _globals["_TYPEDAGGREGATEEXPRESSION"]._serialized_start = 8296
+ _globals["_TYPEDAGGREGATEEXPRESSION"]._serialized_end = 8395
+ _globals["_CALLFUNCTION"]._serialized_start = 8397
+ _globals["_CALLFUNCTION"]._serialized_end = 8505
+ _globals["_NAMEDARGUMENTEXPRESSION"]._serialized_start = 8507
+ _globals["_NAMEDARGUMENTEXPRESSION"]._serialized_end = 8599
+ _globals["_MERGEACTION"]._serialized_start = 8602
+ _globals["_MERGEACTION"]._serialized_end = 9114
+ _globals["_MERGEACTION_ASSIGNMENT"]._serialized_start = 8824
+ _globals["_MERGEACTION_ASSIGNMENT"]._serialized_end = 8930
+ _globals["_MERGEACTION_ACTIONTYPE"]._serialized_start = 8933
+ _globals["_MERGEACTION_ACTIONTYPE"]._serialized_end = 9100
+ _globals["_SUBQUERYEXPRESSION"]._serialized_start = 9117
+ _globals["_SUBQUERYEXPRESSION"]._serialized_end = 9826
+ _globals["_SUBQUERYEXPRESSION_TABLEARGOPTIONS"]._serialized_start = 9423
+ _globals["_SUBQUERYEXPRESSION_TABLEARGOPTIONS"]._serialized_end = 9657
+ _globals["_SUBQUERYEXPRESSION_SUBQUERYTYPE"]._serialized_start = 9660
+ _globals["_SUBQUERYEXPRESSION_SUBQUERYTYPE"]._serialized_end = 9804
# @@protoc_insertion_point(module_scope)
diff --git a/python/pyspark/sql/connect/proto/expressions_pb2.pyi b/python/pyspark/sql/connect/proto/expressions_pb2.pyi
index 25fc04c0319e6..508a11a01c85e 100644
--- a/python/pyspark/sql/connect/proto/expressions_pb2.pyi
+++ b/python/pyspark/sql/connect/proto/expressions_pb2.pyi
@@ -474,27 +474,51 @@ class Expression(google.protobuf.message.Message):
ELEMENT_TYPE_FIELD_NUMBER: builtins.int
ELEMENTS_FIELD_NUMBER: builtins.int
+ DATA_TYPE_FIELD_NUMBER: builtins.int
@property
- def element_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType: ...
+ def element_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType:
+ """(Deprecated) The element type of the array.
+
+ This field is deprecated since Spark 4.1+ and should only be set
+ if the data_type field is not set. Use data_type field instead.
+ """
@property
def elements(
self,
) -> google.protobuf.internal.containers.RepeatedCompositeFieldContainer[
global___Expression.Literal
- ]: ...
+ ]:
+ """The literal values that make up the array elements."""
+ @property
+ def data_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType.Array:
+ """The type of the array.
+
+ If the element type can be inferred from the first element of the elements field,
+ then you don't need to set data_type.element_type to save space. On the other hand,
+ redundant type information is also acceptable.
+ """
def __init__(
self,
*,
element_type: pyspark.sql.connect.proto.types_pb2.DataType | None = ...,
elements: collections.abc.Iterable[global___Expression.Literal] | None = ...,
+ data_type: pyspark.sql.connect.proto.types_pb2.DataType.Array | None = ...,
) -> None: ...
def HasField(
- self, field_name: typing_extensions.Literal["element_type", b"element_type"]
+ self,
+ field_name: typing_extensions.Literal[
+ "data_type", b"data_type", "element_type", b"element_type"
+ ],
) -> builtins.bool: ...
def ClearField(
self,
field_name: typing_extensions.Literal[
- "element_type", b"element_type", "elements", b"elements"
+ "data_type",
+ b"data_type",
+ "element_type",
+ b"element_type",
+ "elements",
+ b"elements",
],
) -> None: ...
@@ -505,22 +529,43 @@ class Expression(google.protobuf.message.Message):
VALUE_TYPE_FIELD_NUMBER: builtins.int
KEYS_FIELD_NUMBER: builtins.int
VALUES_FIELD_NUMBER: builtins.int
+ DATA_TYPE_FIELD_NUMBER: builtins.int
@property
- def key_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType: ...
+ def key_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType:
+ """(Deprecated) The key type of the map.
+
+ This field is deprecated since Spark 4.1+ and should only be set
+ if the data_type field is not set. Use data_type field instead.
+ """
@property
- def value_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType: ...
+ def value_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType:
+ """(Deprecated) The value type of the map.
+
+ This field is deprecated since Spark 4.1+ and should only be set
+ if the data_type field is not set. Use data_type field instead.
+ """
@property
def keys(
self,
) -> google.protobuf.internal.containers.RepeatedCompositeFieldContainer[
global___Expression.Literal
- ]: ...
+ ]:
+ """The literal keys that make up the map."""
@property
def values(
self,
) -> google.protobuf.internal.containers.RepeatedCompositeFieldContainer[
global___Expression.Literal
- ]: ...
+ ]:
+ """The literal values that make up the map."""
+ @property
+ def data_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType.Map:
+ """The type of the map.
+
+ If the key/value types can be inferred from the first element of the keys/values fields,
+ then you don't need to set data_type.key_type/data_type.value_type to save space.
+ On the other hand, redundant type information is also acceptable.
+ """
def __init__(
self,
*,
@@ -528,16 +573,19 @@ class Expression(google.protobuf.message.Message):
value_type: pyspark.sql.connect.proto.types_pb2.DataType | None = ...,
keys: collections.abc.Iterable[global___Expression.Literal] | None = ...,
values: collections.abc.Iterable[global___Expression.Literal] | None = ...,
+ data_type: pyspark.sql.connect.proto.types_pb2.DataType.Map | None = ...,
) -> None: ...
def HasField(
self,
field_name: typing_extensions.Literal[
- "key_type", b"key_type", "value_type", b"value_type"
+ "data_type", b"data_type", "key_type", b"key_type", "value_type", b"value_type"
],
) -> builtins.bool: ...
def ClearField(
self,
field_name: typing_extensions.Literal[
+ "data_type",
+ b"data_type",
"key_type",
b"key_type",
"keys",
@@ -554,27 +602,51 @@ class Expression(google.protobuf.message.Message):
STRUCT_TYPE_FIELD_NUMBER: builtins.int
ELEMENTS_FIELD_NUMBER: builtins.int
+ DATA_TYPE_STRUCT_FIELD_NUMBER: builtins.int
@property
- def struct_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType: ...
+ def struct_type(self) -> pyspark.sql.connect.proto.types_pb2.DataType:
+ """(Deprecated) The type of the struct.
+
+ This field is deprecated since Spark 4.1+ because using DataType as the type of a struct
+ is ambiguous. This field should only be set if the data_type_struct field is not set.
+ Use data_type_struct field instead.
+ """
@property
def elements(
self,
) -> google.protobuf.internal.containers.RepeatedCompositeFieldContainer[
global___Expression.Literal
- ]: ...
+ ]:
+ """(Required) The literal values that make up the struct elements."""
+ @property
+ def data_type_struct(self) -> pyspark.sql.connect.proto.types_pb2.DataType.Struct:
+ """The type of the struct.
+
+ Whether data_type_struct.fields.data_type should be set depends on
+ whether each field's type can be inferred from the elements field.
+ """
def __init__(
self,
*,
struct_type: pyspark.sql.connect.proto.types_pb2.DataType | None = ...,
elements: collections.abc.Iterable[global___Expression.Literal] | None = ...,
+ data_type_struct: pyspark.sql.connect.proto.types_pb2.DataType.Struct | None = ...,
) -> None: ...
def HasField(
- self, field_name: typing_extensions.Literal["struct_type", b"struct_type"]
+ self,
+ field_name: typing_extensions.Literal[
+ "data_type_struct", b"data_type_struct", "struct_type", b"struct_type"
+ ],
) -> builtins.bool: ...
def ClearField(
self,
field_name: typing_extensions.Literal[
- "elements", b"elements", "struct_type", b"struct_type"
+ "data_type_struct",
+ b"data_type_struct",
+ "elements",
+ b"elements",
+ "struct_type",
+ b"struct_type",
],
) -> None: ...
@@ -654,6 +726,36 @@ class Expression(google.protobuf.message.Message):
| None
): ...
+ class Time(google.protobuf.message.Message):
+ DESCRIPTOR: google.protobuf.descriptor.Descriptor
+
+ NANO_FIELD_NUMBER: builtins.int
+ PRECISION_FIELD_NUMBER: builtins.int
+ nano: builtins.int
+ precision: builtins.int
+ """The precision of this time, if omitted, uses the default value of MICROS_PRECISION."""
+ def __init__(
+ self,
+ *,
+ nano: builtins.int = ...,
+ precision: builtins.int | None = ...,
+ ) -> None: ...
+ def HasField(
+ self,
+ field_name: typing_extensions.Literal[
+ "_precision", b"_precision", "precision", b"precision"
+ ],
+ ) -> builtins.bool: ...
+ def ClearField(
+ self,
+ field_name: typing_extensions.Literal[
+ "_precision", b"_precision", "nano", b"nano", "precision", b"precision"
+ ],
+ ) -> None: ...
+ def WhichOneof(
+ self, oneof_group: typing_extensions.Literal["_precision", b"_precision"]
+ ) -> typing_extensions.Literal["precision"] | None: ...
+
NULL_FIELD_NUMBER: builtins.int
BINARY_FIELD_NUMBER: builtins.int
BOOLEAN_FIELD_NUMBER: builtins.int
@@ -675,6 +777,7 @@ class Expression(google.protobuf.message.Message):
MAP_FIELD_NUMBER: builtins.int
STRUCT_FIELD_NUMBER: builtins.int
SPECIALIZED_ARRAY_FIELD_NUMBER: builtins.int
+ TIME_FIELD_NUMBER: builtins.int
@property
def null(self) -> pyspark.sql.connect.proto.types_pb2.DataType: ...
binary: builtins.bytes
@@ -706,6 +809,8 @@ class Expression(google.protobuf.message.Message):
def struct(self) -> global___Expression.Literal.Struct: ...
@property
def specialized_array(self) -> global___Expression.Literal.SpecializedArray: ...
+ @property
+ def time(self) -> global___Expression.Literal.Time: ...
def __init__(
self,
*,
@@ -730,6 +835,7 @@ class Expression(google.protobuf.message.Message):
map: global___Expression.Literal.Map | None = ...,
struct: global___Expression.Literal.Struct | None = ...,
specialized_array: global___Expression.Literal.SpecializedArray | None = ...,
+ time: global___Expression.Literal.Time | None = ...,
) -> None: ...
def HasField(
self,
@@ -772,6 +878,8 @@ class Expression(google.protobuf.message.Message):
b"string",
"struct",
b"struct",
+ "time",
+ b"time",
"timestamp",
b"timestamp",
"timestamp_ntz",
@@ -821,6 +929,8 @@ class Expression(google.protobuf.message.Message):
b"string",
"struct",
b"struct",
+ "time",
+ b"time",
"timestamp",
b"timestamp",
"timestamp_ntz",
@@ -854,6 +964,7 @@ class Expression(google.protobuf.message.Message):
"map",
"struct",
"specialized_array",
+ "time",
]
| None
): ...
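Illustrative sketch (not generated code): how a client could populate the new Literal.Array data_type field instead of the deprecated element_type, assuming the stub names above and the standard DataType messages; the values are hypothetical.

from pyspark.sql.connect.proto import expressions_pb2, types_pb2

# Carry the array type once via the new data_type field and leave the
# deprecated element_type unset; element literals then omit redundant type info.
array_literal = expressions_pb2.Expression.Literal(
    array=expressions_pb2.Expression.Literal.Array(
        data_type=types_pb2.DataType.Array(
            element_type=types_pb2.DataType(integer=types_pb2.DataType.Integer())
        ),
        elements=[
            expressions_pb2.Expression.Literal(integer=1),
            expressions_pb2.Expression.Literal(integer=2),
        ],
    )
)
assert array_literal.array.HasField("data_type")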
diff --git a/python/pyspark/sql/connect/proto/ml_pb2.py b/python/pyspark/sql/connect/proto/ml_pb2.py
index 46fc82131a9e7..4c1b4038c35e3 100644
--- a/python/pyspark/sql/connect/proto/ml_pb2.py
+++ b/python/pyspark/sql/connect/proto/ml_pb2.py
@@ -40,7 +40,7 @@
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(
- b'\n\x16spark/connect/ml.proto\x12\rspark.connect\x1a\x1dspark/connect/relations.proto\x1a\x1fspark/connect/expressions.proto\x1a\x1dspark/connect/ml_common.proto"\xb2\x0b\n\tMlCommand\x12\x30\n\x03\x66it\x18\x01 \x01(\x0b\x32\x1c.spark.connect.MlCommand.FitH\x00R\x03\x66it\x12,\n\x05\x66\x65tch\x18\x02 \x01(\x0b\x32\x14.spark.connect.FetchH\x00R\x05\x66\x65tch\x12\x39\n\x06\x64\x65lete\x18\x03 \x01(\x0b\x32\x1f.spark.connect.MlCommand.DeleteH\x00R\x06\x64\x65lete\x12\x36\n\x05write\x18\x04 \x01(\x0b\x32\x1e.spark.connect.MlCommand.WriteH\x00R\x05write\x12\x33\n\x04read\x18\x05 \x01(\x0b\x32\x1d.spark.connect.MlCommand.ReadH\x00R\x04read\x12?\n\x08\x65valuate\x18\x06 \x01(\x0b\x32!.spark.connect.MlCommand.EvaluateH\x00R\x08\x65valuate\x12\x46\n\x0b\x63lean_cache\x18\x07 \x01(\x0b\x32#.spark.connect.MlCommand.CleanCacheH\x00R\ncleanCache\x12M\n\x0eget_cache_info\x18\x08 \x01(\x0b\x32%.spark.connect.MlCommand.GetCacheInfoH\x00R\x0cgetCacheInfo\x1a\xb2\x01\n\x03\x46it\x12\x37\n\testimator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorR\testimator\x12\x34\n\x06params\x18\x02 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x00R\x06params\x88\x01\x01\x12\x31\n\x07\x64\x61taset\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x07\x64\x61tasetB\t\n\x07_params\x1a=\n\x06\x44\x65lete\x12\x33\n\x08obj_refs\x18\x01 \x03(\x0b\x32\x18.spark.connect.ObjectRefR\x07objRefs\x1a\x0c\n\nCleanCache\x1a\x0e\n\x0cGetCacheInfo\x1a\x9a\x03\n\x05Write\x12\x37\n\x08operator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorH\x00R\x08operator\x12\x33\n\x07obj_ref\x18\x02 \x01(\x0b\x32\x18.spark.connect.ObjectRefH\x00R\x06objRef\x12\x34\n\x06params\x18\x03 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x01R\x06params\x88\x01\x01\x12\x12\n\x04path\x18\x04 \x01(\tR\x04path\x12.\n\x10should_overwrite\x18\x05 \x01(\x08H\x02R\x0fshouldOverwrite\x88\x01\x01\x12\x45\n\x07options\x18\x06 \x03(\x0b\x32+.spark.connect.MlCommand.Write.OptionsEntryR\x07options\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x42\x06\n\x04typeB\t\n\x07_paramsB\x13\n\x11_should_overwrite\x1aQ\n\x04Read\x12\x35\n\x08operator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorR\x08operator\x12\x12\n\x04path\x18\x02 \x01(\tR\x04path\x1a\xb7\x01\n\x08\x45valuate\x12\x37\n\tevaluator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorR\tevaluator\x12\x34\n\x06params\x18\x02 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x00R\x06params\x88\x01\x01\x12\x31\n\x07\x64\x61taset\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x07\x64\x61tasetB\t\n\x07_paramsB\t\n\x07\x63ommand"\xd5\x03\n\x0fMlCommandResult\x12\x39\n\x05param\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralH\x00R\x05param\x12\x1a\n\x07summary\x18\x02 \x01(\tH\x00R\x07summary\x12T\n\roperator_info\x18\x03 \x01(\x0b\x32-.spark.connect.MlCommandResult.MlOperatorInfoH\x00R\x0coperatorInfo\x1a\x85\x02\n\x0eMlOperatorInfo\x12\x33\n\x07obj_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefH\x00R\x06objRef\x12\x14\n\x04name\x18\x02 \x01(\tH\x00R\x04name\x12\x15\n\x03uid\x18\x03 \x01(\tH\x01R\x03uid\x88\x01\x01\x12\x34\n\x06params\x18\x04 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x02R\x06params\x88\x01\x01\x12,\n\x0fwarning_message\x18\x05 \x01(\tH\x03R\x0ewarningMessage\x88\x01\x01\x42\x06\n\x04typeB\x06\n\x04_uidB\t\n\x07_paramsB\x12\n\x10_warning_messageB\r\n\x0bresult_typeB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
+ b'\n\x16spark/connect/ml.proto\x12\rspark.connect\x1a\x1dspark/connect/relations.proto\x1a\x1fspark/connect/expressions.proto\x1a\x1dspark/connect/ml_common.proto"\xc7\x0e\n\tMlCommand\x12\x30\n\x03\x66it\x18\x01 \x01(\x0b\x32\x1c.spark.connect.MlCommand.FitH\x00R\x03\x66it\x12,\n\x05\x66\x65tch\x18\x02 \x01(\x0b\x32\x14.spark.connect.FetchH\x00R\x05\x66\x65tch\x12\x39\n\x06\x64\x65lete\x18\x03 \x01(\x0b\x32\x1f.spark.connect.MlCommand.DeleteH\x00R\x06\x64\x65lete\x12\x36\n\x05write\x18\x04 \x01(\x0b\x32\x1e.spark.connect.MlCommand.WriteH\x00R\x05write\x12\x33\n\x04read\x18\x05 \x01(\x0b\x32\x1d.spark.connect.MlCommand.ReadH\x00R\x04read\x12?\n\x08\x65valuate\x18\x06 \x01(\x0b\x32!.spark.connect.MlCommand.EvaluateH\x00R\x08\x65valuate\x12\x46\n\x0b\x63lean_cache\x18\x07 \x01(\x0b\x32#.spark.connect.MlCommand.CleanCacheH\x00R\ncleanCache\x12M\n\x0eget_cache_info\x18\x08 \x01(\x0b\x32%.spark.connect.MlCommand.GetCacheInfoH\x00R\x0cgetCacheInfo\x12O\n\x0e\x63reate_summary\x18\t \x01(\x0b\x32&.spark.connect.MlCommand.CreateSummaryH\x00R\rcreateSummary\x12M\n\x0eget_model_size\x18\n \x01(\x0b\x32%.spark.connect.MlCommand.GetModelSizeH\x00R\x0cgetModelSize\x1a\xb2\x01\n\x03\x46it\x12\x37\n\testimator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorR\testimator\x12\x34\n\x06params\x18\x02 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x00R\x06params\x88\x01\x01\x12\x31\n\x07\x64\x61taset\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x07\x64\x61tasetB\t\n\x07_params\x1ap\n\x06\x44\x65lete\x12\x33\n\x08obj_refs\x18\x01 \x03(\x0b\x32\x18.spark.connect.ObjectRefR\x07objRefs\x12"\n\nevict_only\x18\x02 \x01(\x08H\x00R\tevictOnly\x88\x01\x01\x42\r\n\x0b_evict_only\x1a\x0c\n\nCleanCache\x1a\x0e\n\x0cGetCacheInfo\x1a\x9a\x03\n\x05Write\x12\x37\n\x08operator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorH\x00R\x08operator\x12\x33\n\x07obj_ref\x18\x02 \x01(\x0b\x32\x18.spark.connect.ObjectRefH\x00R\x06objRef\x12\x34\n\x06params\x18\x03 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x01R\x06params\x88\x01\x01\x12\x12\n\x04path\x18\x04 \x01(\tR\x04path\x12.\n\x10should_overwrite\x18\x05 \x01(\x08H\x02R\x0fshouldOverwrite\x88\x01\x01\x12\x45\n\x07options\x18\x06 \x03(\x0b\x32+.spark.connect.MlCommand.Write.OptionsEntryR\x07options\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x42\x06\n\x04typeB\t\n\x07_paramsB\x13\n\x11_should_overwrite\x1aQ\n\x04Read\x12\x35\n\x08operator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorR\x08operator\x12\x12\n\x04path\x18\x02 \x01(\tR\x04path\x1a\xb7\x01\n\x08\x45valuate\x12\x37\n\tevaluator\x18\x01 \x01(\x0b\x32\x19.spark.connect.MlOperatorR\tevaluator\x12\x34\n\x06params\x18\x02 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x00R\x06params\x88\x01\x01\x12\x31\n\x07\x64\x61taset\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x07\x64\x61tasetB\t\n\x07_params\x1ay\n\rCreateSummary\x12\x35\n\tmodel_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefR\x08modelRef\x12\x31\n\x07\x64\x61taset\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\x07\x64\x61taset\x1a\x45\n\x0cGetModelSize\x12\x35\n\tmodel_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefR\x08modelRefB\t\n\x07\x63ommand"\xd5\x03\n\x0fMlCommandResult\x12\x39\n\x05param\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralH\x00R\x05param\x12\x1a\n\x07summary\x18\x02 \x01(\tH\x00R\x07summary\x12T\n\roperator_info\x18\x03 
\x01(\x0b\x32-.spark.connect.MlCommandResult.MlOperatorInfoH\x00R\x0coperatorInfo\x1a\x85\x02\n\x0eMlOperatorInfo\x12\x33\n\x07obj_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefH\x00R\x06objRef\x12\x14\n\x04name\x18\x02 \x01(\tH\x00R\x04name\x12\x15\n\x03uid\x18\x03 \x01(\tH\x01R\x03uid\x88\x01\x01\x12\x34\n\x06params\x18\x04 \x01(\x0b\x32\x17.spark.connect.MlParamsH\x02R\x06params\x88\x01\x01\x12,\n\x0fwarning_message\x18\x05 \x01(\tH\x03R\x0ewarningMessage\x88\x01\x01\x42\x06\n\x04typeB\x06\n\x04_uidB\t\n\x07_paramsB\x12\n\x10_warning_messageB\r\n\x0bresult_typeB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
)
_globals = globals()
@@ -54,25 +54,29 @@
_globals["_MLCOMMAND_WRITE_OPTIONSENTRY"]._loaded_options = None
_globals["_MLCOMMAND_WRITE_OPTIONSENTRY"]._serialized_options = b"8\001"
_globals["_MLCOMMAND"]._serialized_start = 137
- _globals["_MLCOMMAND"]._serialized_end = 1595
- _globals["_MLCOMMAND_FIT"]._serialized_start = 631
- _globals["_MLCOMMAND_FIT"]._serialized_end = 809
- _globals["_MLCOMMAND_DELETE"]._serialized_start = 811
- _globals["_MLCOMMAND_DELETE"]._serialized_end = 872
- _globals["_MLCOMMAND_CLEANCACHE"]._serialized_start = 874
- _globals["_MLCOMMAND_CLEANCACHE"]._serialized_end = 886
- _globals["_MLCOMMAND_GETCACHEINFO"]._serialized_start = 888
- _globals["_MLCOMMAND_GETCACHEINFO"]._serialized_end = 902
- _globals["_MLCOMMAND_WRITE"]._serialized_start = 905
- _globals["_MLCOMMAND_WRITE"]._serialized_end = 1315
- _globals["_MLCOMMAND_WRITE_OPTIONSENTRY"]._serialized_start = 1217
- _globals["_MLCOMMAND_WRITE_OPTIONSENTRY"]._serialized_end = 1275
- _globals["_MLCOMMAND_READ"]._serialized_start = 1317
- _globals["_MLCOMMAND_READ"]._serialized_end = 1398
- _globals["_MLCOMMAND_EVALUATE"]._serialized_start = 1401
- _globals["_MLCOMMAND_EVALUATE"]._serialized_end = 1584
- _globals["_MLCOMMANDRESULT"]._serialized_start = 1598
- _globals["_MLCOMMANDRESULT"]._serialized_end = 2067
- _globals["_MLCOMMANDRESULT_MLOPERATORINFO"]._serialized_start = 1791
- _globals["_MLCOMMANDRESULT_MLOPERATORINFO"]._serialized_end = 2052
+ _globals["_MLCOMMAND"]._serialized_end = 2000
+ _globals["_MLCOMMAND_FIT"]._serialized_start = 791
+ _globals["_MLCOMMAND_FIT"]._serialized_end = 969
+ _globals["_MLCOMMAND_DELETE"]._serialized_start = 971
+ _globals["_MLCOMMAND_DELETE"]._serialized_end = 1083
+ _globals["_MLCOMMAND_CLEANCACHE"]._serialized_start = 1085
+ _globals["_MLCOMMAND_CLEANCACHE"]._serialized_end = 1097
+ _globals["_MLCOMMAND_GETCACHEINFO"]._serialized_start = 1099
+ _globals["_MLCOMMAND_GETCACHEINFO"]._serialized_end = 1113
+ _globals["_MLCOMMAND_WRITE"]._serialized_start = 1116
+ _globals["_MLCOMMAND_WRITE"]._serialized_end = 1526
+ _globals["_MLCOMMAND_WRITE_OPTIONSENTRY"]._serialized_start = 1428
+ _globals["_MLCOMMAND_WRITE_OPTIONSENTRY"]._serialized_end = 1486
+ _globals["_MLCOMMAND_READ"]._serialized_start = 1528
+ _globals["_MLCOMMAND_READ"]._serialized_end = 1609
+ _globals["_MLCOMMAND_EVALUATE"]._serialized_start = 1612
+ _globals["_MLCOMMAND_EVALUATE"]._serialized_end = 1795
+ _globals["_MLCOMMAND_CREATESUMMARY"]._serialized_start = 1797
+ _globals["_MLCOMMAND_CREATESUMMARY"]._serialized_end = 1918
+ _globals["_MLCOMMAND_GETMODELSIZE"]._serialized_start = 1920
+ _globals["_MLCOMMAND_GETMODELSIZE"]._serialized_end = 1989
+ _globals["_MLCOMMANDRESULT"]._serialized_start = 2003
+ _globals["_MLCOMMANDRESULT"]._serialized_end = 2472
+ _globals["_MLCOMMANDRESULT_MLOPERATORINFO"]._serialized_start = 2196
+ _globals["_MLCOMMANDRESULT_MLOPERATORINFO"]._serialized_end = 2457
# @@protoc_insertion_point(module_scope)
diff --git a/python/pyspark/sql/connect/proto/ml_pb2.pyi b/python/pyspark/sql/connect/proto/ml_pb2.pyi
index 88cc6cb625ded..156ef846a8d10 100644
--- a/python/pyspark/sql/connect/proto/ml_pb2.pyi
+++ b/python/pyspark/sql/connect/proto/ml_pb2.pyi
@@ -118,21 +118,39 @@ class MlCommand(google.protobuf.message.Message):
DESCRIPTOR: google.protobuf.descriptor.Descriptor
OBJ_REFS_FIELD_NUMBER: builtins.int
+ EVICT_ONLY_FIELD_NUMBER: builtins.int
@property
def obj_refs(
self,
) -> google.protobuf.internal.containers.RepeatedCompositeFieldContainer[
pyspark.sql.connect.proto.ml_common_pb2.ObjectRef
]: ...
+ evict_only: builtins.bool
+ """if set `evict_only` to true, only evict the cached model from memory,
+ but keep the offloaded model in Spark driver local disk.
+ """
def __init__(
self,
*,
obj_refs: collections.abc.Iterable[pyspark.sql.connect.proto.ml_common_pb2.ObjectRef]
| None = ...,
+ evict_only: builtins.bool | None = ...,
) -> None: ...
+ def HasField(
+ self,
+ field_name: typing_extensions.Literal[
+ "_evict_only", b"_evict_only", "evict_only", b"evict_only"
+ ],
+ ) -> builtins.bool: ...
def ClearField(
- self, field_name: typing_extensions.Literal["obj_refs", b"obj_refs"]
+ self,
+ field_name: typing_extensions.Literal[
+ "_evict_only", b"_evict_only", "evict_only", b"evict_only", "obj_refs", b"obj_refs"
+ ],
) -> None: ...
+ def WhichOneof(
+ self, oneof_group: typing_extensions.Literal["_evict_only", b"_evict_only"]
+ ) -> typing_extensions.Literal["evict_only"] | None: ...
class CleanCache(google.protobuf.message.Message):
"""Force to clean up all the ML cached objects"""
@@ -342,6 +360,54 @@ class MlCommand(google.protobuf.message.Message):
self, oneof_group: typing_extensions.Literal["_params", b"_params"]
) -> typing_extensions.Literal["params"] | None: ...
+ class CreateSummary(google.protobuf.message.Message):
+ """This is for re-creating the model summary when the model summary is lost
+ (model summary is lost when the model is offloaded and then loaded back)
+ """
+
+ DESCRIPTOR: google.protobuf.descriptor.Descriptor
+
+ MODEL_REF_FIELD_NUMBER: builtins.int
+ DATASET_FIELD_NUMBER: builtins.int
+ @property
+ def model_ref(self) -> pyspark.sql.connect.proto.ml_common_pb2.ObjectRef: ...
+ @property
+ def dataset(self) -> pyspark.sql.connect.proto.relations_pb2.Relation: ...
+ def __init__(
+ self,
+ *,
+ model_ref: pyspark.sql.connect.proto.ml_common_pb2.ObjectRef | None = ...,
+ dataset: pyspark.sql.connect.proto.relations_pb2.Relation | None = ...,
+ ) -> None: ...
+ def HasField(
+ self,
+ field_name: typing_extensions.Literal["dataset", b"dataset", "model_ref", b"model_ref"],
+ ) -> builtins.bool: ...
+ def ClearField(
+ self,
+ field_name: typing_extensions.Literal["dataset", b"dataset", "model_ref", b"model_ref"],
+ ) -> None: ...
+
+ class GetModelSize(google.protobuf.message.Message):
+ """This is for query the model estimated in-memory size"""
+
+ DESCRIPTOR: google.protobuf.descriptor.Descriptor
+
+ MODEL_REF_FIELD_NUMBER: builtins.int
+ @property
+ def model_ref(self) -> pyspark.sql.connect.proto.ml_common_pb2.ObjectRef: ...
+ def __init__(
+ self,
+ *,
+ model_ref: pyspark.sql.connect.proto.ml_common_pb2.ObjectRef | None = ...,
+ ) -> None: ...
+ def HasField(
+ self, field_name: typing_extensions.Literal["model_ref", b"model_ref"]
+ ) -> builtins.bool: ...
+ def ClearField(
+ self, field_name: typing_extensions.Literal["model_ref", b"model_ref"]
+ ) -> None: ...
+
FIT_FIELD_NUMBER: builtins.int
FETCH_FIELD_NUMBER: builtins.int
DELETE_FIELD_NUMBER: builtins.int
@@ -350,6 +416,8 @@ class MlCommand(google.protobuf.message.Message):
EVALUATE_FIELD_NUMBER: builtins.int
CLEAN_CACHE_FIELD_NUMBER: builtins.int
GET_CACHE_INFO_FIELD_NUMBER: builtins.int
+ CREATE_SUMMARY_FIELD_NUMBER: builtins.int
+ GET_MODEL_SIZE_FIELD_NUMBER: builtins.int
@property
def fit(self) -> global___MlCommand.Fit: ...
@property
@@ -366,6 +434,10 @@ class MlCommand(google.protobuf.message.Message):
def clean_cache(self) -> global___MlCommand.CleanCache: ...
@property
def get_cache_info(self) -> global___MlCommand.GetCacheInfo: ...
+ @property
+ def create_summary(self) -> global___MlCommand.CreateSummary: ...
+ @property
+ def get_model_size(self) -> global___MlCommand.GetModelSize: ...
def __init__(
self,
*,
@@ -377,6 +449,8 @@ class MlCommand(google.protobuf.message.Message):
evaluate: global___MlCommand.Evaluate | None = ...,
clean_cache: global___MlCommand.CleanCache | None = ...,
get_cache_info: global___MlCommand.GetCacheInfo | None = ...,
+ create_summary: global___MlCommand.CreateSummary | None = ...,
+ get_model_size: global___MlCommand.GetModelSize | None = ...,
) -> None: ...
def HasField(
self,
@@ -385,6 +459,8 @@ class MlCommand(google.protobuf.message.Message):
b"clean_cache",
"command",
b"command",
+ "create_summary",
+ b"create_summary",
"delete",
b"delete",
"evaluate",
@@ -395,6 +471,8 @@ class MlCommand(google.protobuf.message.Message):
b"fit",
"get_cache_info",
b"get_cache_info",
+ "get_model_size",
+ b"get_model_size",
"read",
b"read",
"write",
@@ -408,6 +486,8 @@ class MlCommand(google.protobuf.message.Message):
b"clean_cache",
"command",
b"command",
+ "create_summary",
+ b"create_summary",
"delete",
b"delete",
"evaluate",
@@ -418,6 +498,8 @@ class MlCommand(google.protobuf.message.Message):
b"fit",
"get_cache_info",
b"get_cache_info",
+ "get_model_size",
+ b"get_model_size",
"read",
b"read",
"write",
@@ -428,7 +510,16 @@ class MlCommand(google.protobuf.message.Message):
self, oneof_group: typing_extensions.Literal["command", b"command"]
) -> (
typing_extensions.Literal[
- "fit", "fetch", "delete", "write", "read", "evaluate", "clean_cache", "get_cache_info"
+ "fit",
+ "fetch",
+ "delete",
+ "write",
+ "read",
+ "evaluate",
+ "clean_cache",
+ "get_cache_info",
+ "create_summary",
+ "get_model_size",
]
| None
): ...
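Illustrative sketch (not generated code): building the new MlCommand variants surfaced in these stubs; assumes ObjectRef carries a string id as in ml_common.proto, and the reference ids are hypothetical.

from pyspark.sql.connect.proto import ml_pb2, ml_common_pb2

# Evict a cached model from memory while keeping its offloaded copy on the
# driver's local disk (new evict_only flag on Delete).
delete_cmd = ml_pb2.MlCommand(
    delete=ml_pb2.MlCommand.Delete(
        obj_refs=[ml_common_pb2.ObjectRef(id="model-ref-1")],  # hypothetical ref id
        evict_only=True,
    )
)

# Query a model's estimated in-memory size via the new GetModelSize command.
size_cmd = ml_pb2.MlCommand(
    get_model_size=ml_pb2.MlCommand.GetModelSize(
        model_ref=ml_common_pb2.ObjectRef(id="model-ref-1")  # hypothetical ref id
    )
)
assert delete_cmd.WhichOneof("command") == "delete"
assert size_cmd.WhichOneof("command") == "get_model_size"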
diff --git a/python/pyspark/sql/connect/proto/pipelines_pb2.py b/python/pyspark/sql/connect/proto/pipelines_pb2.py
index 017e7285f8848..08b39a39e831a 100644
--- a/python/pyspark/sql/connect/proto/pipelines_pb2.py
+++ b/python/pyspark/sql/connect/proto/pipelines_pb2.py
@@ -40,7 +40,7 @@
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(
- b'\n\x1dspark/connect/pipelines.proto\x12\rspark.connect\x1a\x1fgoogle/protobuf/timestamp.proto\x1a\x1dspark/connect/relations.proto\x1a\x19spark/connect/types.proto"\xe6\x12\n\x0fPipelineCommand\x12h\n\x15\x63reate_dataflow_graph\x18\x01 \x01(\x0b\x32\x32.spark.connect.PipelineCommand.CreateDataflowGraphH\x00R\x13\x63reateDataflowGraph\x12U\n\x0e\x64\x65\x66ine_dataset\x18\x02 \x01(\x0b\x32,.spark.connect.PipelineCommand.DefineDatasetH\x00R\rdefineDataset\x12L\n\x0b\x64\x65\x66ine_flow\x18\x03 \x01(\x0b\x32).spark.connect.PipelineCommand.DefineFlowH\x00R\ndefineFlow\x12\x62\n\x13\x64rop_dataflow_graph\x18\x04 \x01(\x0b\x32\x30.spark.connect.PipelineCommand.DropDataflowGraphH\x00R\x11\x64ropDataflowGraph\x12\x46\n\tstart_run\x18\x05 \x01(\x0b\x32\'.spark.connect.PipelineCommand.StartRunH\x00R\x08startRun\x12r\n\x19\x64\x65\x66ine_sql_graph_elements\x18\x06 \x01(\x0b\x32\x35.spark.connect.PipelineCommand.DefineSqlGraphElementsH\x00R\x16\x64\x65\x66ineSqlGraphElements\x1a\x87\x03\n\x13\x43reateDataflowGraph\x12,\n\x0f\x64\x65\x66\x61ult_catalog\x18\x01 \x01(\tH\x00R\x0e\x64\x65\x66\x61ultCatalog\x88\x01\x01\x12.\n\x10\x64\x65\x66\x61ult_database\x18\x02 \x01(\tH\x01R\x0f\x64\x65\x66\x61ultDatabase\x88\x01\x01\x12Z\n\x08sql_conf\x18\x05 \x03(\x0b\x32?.spark.connect.PipelineCommand.CreateDataflowGraph.SqlConfEntryR\x07sqlConf\x1a:\n\x0cSqlConfEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x1aQ\n\x08Response\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\x12\n\x10_default_catalogB\x13\n\x11_default_database\x1aZ\n\x11\x44ropDataflowGraph\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_id\x1a\xd1\x04\n\rDefineDataset\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12&\n\x0c\x64\x61taset_name\x18\x02 \x01(\tH\x01R\x0b\x64\x61tasetName\x88\x01\x01\x12\x42\n\x0c\x64\x61taset_type\x18\x03 \x01(\x0e\x32\x1a.spark.connect.DatasetTypeH\x02R\x0b\x64\x61tasetType\x88\x01\x01\x12\x1d\n\x07\x63omment\x18\x04 \x01(\tH\x03R\x07\x63omment\x88\x01\x01\x12l\n\x10table_properties\x18\x05 \x03(\x0b\x32\x41.spark.connect.PipelineCommand.DefineDataset.TablePropertiesEntryR\x0ftableProperties\x12%\n\x0epartition_cols\x18\x06 \x03(\tR\rpartitionCols\x12\x34\n\x06schema\x18\x07 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x04R\x06schema\x88\x01\x01\x12\x1b\n\x06\x66ormat\x18\x08 \x01(\tH\x05R\x06\x66ormat\x88\x01\x01\x1a\x42\n\x14TablePropertiesEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x42\x14\n\x12_dataflow_graph_idB\x0f\n\r_dataset_nameB\x0f\n\r_dataset_typeB\n\n\x08_commentB\t\n\x07_schemaB\t\n\x07_format\x1a\xbc\x03\n\nDefineFlow\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12 \n\tflow_name\x18\x02 \x01(\tH\x01R\x08\x66lowName\x88\x01\x01\x12\x33\n\x13target_dataset_name\x18\x03 \x01(\tH\x02R\x11targetDatasetName\x88\x01\x01\x12\x30\n\x04plan\x18\x04 \x01(\x0b\x32\x17.spark.connect.RelationH\x03R\x04plan\x88\x01\x01\x12Q\n\x08sql_conf\x18\x05 \x03(\x0b\x32\x36.spark.connect.PipelineCommand.DefineFlow.SqlConfEntryR\x07sqlConf\x12\x17\n\x04once\x18\x06 \x01(\x08H\x04R\x04once\x88\x01\x01\x1a:\n\x0cSqlConfEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 
\x01(\tR\x05value:\x02\x38\x01\x42\x14\n\x12_dataflow_graph_idB\x0c\n\n_flow_nameB\x16\n\x14_target_dataset_nameB\x07\n\x05_planB\x07\n\x05_once\x1aQ\n\x08StartRun\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_id\x1a\xc7\x01\n\x16\x44\x65\x66ineSqlGraphElements\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12\'\n\rsql_file_path\x18\x02 \x01(\tH\x01R\x0bsqlFilePath\x88\x01\x01\x12\x1e\n\x08sql_text\x18\x03 \x01(\tH\x02R\x07sqlText\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\x10\n\x0e_sql_file_pathB\x0b\n\t_sql_textB\x0e\n\x0c\x63ommand_type"\x8e\x02\n\x15PipelineCommandResult\x12\x81\x01\n\x1c\x63reate_dataflow_graph_result\x18\x01 \x01(\x0b\x32>.spark.connect.PipelineCommandResult.CreateDataflowGraphResultH\x00R\x19\x63reateDataflowGraphResult\x1a\x62\n\x19\x43reateDataflowGraphResult\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\r\n\x0bresult_type"I\n\x13PipelineEventResult\x12\x32\n\x05\x65vent\x18\x01 \x01(\x0b\x32\x1c.spark.connect.PipelineEventR\x05\x65vent"t\n\rPipelineEvent\x12\x38\n\ttimestamp\x18\x01 \x01(\x0b\x32\x1a.google.protobuf.TimestampR\ttimestamp\x12\x1d\n\x07message\x18\x02 \x01(\tH\x00R\x07message\x88\x01\x01\x42\n\n\x08_message*a\n\x0b\x44\x61tasetType\x12\x1c\n\x18\x44\x41TASET_TYPE_UNSPECIFIED\x10\x00\x12\x15\n\x11MATERIALIZED_VIEW\x10\x01\x12\t\n\x05TABLE\x10\x02\x12\x12\n\x0eTEMPORARY_VIEW\x10\x03\x42"\n\x1eorg.apache.spark.connect.protoP\x01\x62\x06proto3'
+ b'\n\x1dspark/connect/pipelines.proto\x12\rspark.connect\x1a\x1fgoogle/protobuf/timestamp.proto\x1a\x1dspark/connect/relations.proto\x1a\x19spark/connect/types.proto"\x97\x14\n\x0fPipelineCommand\x12h\n\x15\x63reate_dataflow_graph\x18\x01 \x01(\x0b\x32\x32.spark.connect.PipelineCommand.CreateDataflowGraphH\x00R\x13\x63reateDataflowGraph\x12U\n\x0e\x64\x65\x66ine_dataset\x18\x02 \x01(\x0b\x32,.spark.connect.PipelineCommand.DefineDatasetH\x00R\rdefineDataset\x12L\n\x0b\x64\x65\x66ine_flow\x18\x03 \x01(\x0b\x32).spark.connect.PipelineCommand.DefineFlowH\x00R\ndefineFlow\x12\x62\n\x13\x64rop_dataflow_graph\x18\x04 \x01(\x0b\x32\x30.spark.connect.PipelineCommand.DropDataflowGraphH\x00R\x11\x64ropDataflowGraph\x12\x46\n\tstart_run\x18\x05 \x01(\x0b\x32\'.spark.connect.PipelineCommand.StartRunH\x00R\x08startRun\x12r\n\x19\x64\x65\x66ine_sql_graph_elements\x18\x06 \x01(\x0b\x32\x35.spark.connect.PipelineCommand.DefineSqlGraphElementsH\x00R\x16\x64\x65\x66ineSqlGraphElements\x1a\x87\x03\n\x13\x43reateDataflowGraph\x12,\n\x0f\x64\x65\x66\x61ult_catalog\x18\x01 \x01(\tH\x00R\x0e\x64\x65\x66\x61ultCatalog\x88\x01\x01\x12.\n\x10\x64\x65\x66\x61ult_database\x18\x02 \x01(\tH\x01R\x0f\x64\x65\x66\x61ultDatabase\x88\x01\x01\x12Z\n\x08sql_conf\x18\x05 \x03(\x0b\x32?.spark.connect.PipelineCommand.CreateDataflowGraph.SqlConfEntryR\x07sqlConf\x1a:\n\x0cSqlConfEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x1aQ\n\x08Response\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\x12\n\x10_default_catalogB\x13\n\x11_default_database\x1aZ\n\x11\x44ropDataflowGraph\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_id\x1a\xd1\x04\n\rDefineDataset\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12&\n\x0c\x64\x61taset_name\x18\x02 \x01(\tH\x01R\x0b\x64\x61tasetName\x88\x01\x01\x12\x42\n\x0c\x64\x61taset_type\x18\x03 \x01(\x0e\x32\x1a.spark.connect.DatasetTypeH\x02R\x0b\x64\x61tasetType\x88\x01\x01\x12\x1d\n\x07\x63omment\x18\x04 \x01(\tH\x03R\x07\x63omment\x88\x01\x01\x12l\n\x10table_properties\x18\x05 \x03(\x0b\x32\x41.spark.connect.PipelineCommand.DefineDataset.TablePropertiesEntryR\x0ftableProperties\x12%\n\x0epartition_cols\x18\x06 \x03(\tR\rpartitionCols\x12\x34\n\x06schema\x18\x07 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x04R\x06schema\x88\x01\x01\x12\x1b\n\x06\x66ormat\x18\x08 \x01(\tH\x05R\x06\x66ormat\x88\x01\x01\x1a\x42\n\x14TablePropertiesEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x42\x14\n\x12_dataflow_graph_idB\x0f\n\r_dataset_nameB\x0f\n\r_dataset_typeB\n\n\x08_commentB\t\n\x07_schemaB\t\n\x07_format\x1a\xa6\x03\n\nDefineFlow\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12 \n\tflow_name\x18\x02 \x01(\tH\x01R\x08\x66lowName\x88\x01\x01\x12\x33\n\x13target_dataset_name\x18\x03 \x01(\tH\x02R\x11targetDatasetName\x88\x01\x01\x12\x38\n\x08relation\x18\x04 \x01(\x0b\x32\x17.spark.connect.RelationH\x03R\x08relation\x88\x01\x01\x12Q\n\x08sql_conf\x18\x05 \x03(\x0b\x32\x36.spark.connect.PipelineCommand.DefineFlow.SqlConfEntryR\x07sqlConf\x1a:\n\x0cSqlConfEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 
\x01(\tR\x05value:\x02\x38\x01\x42\x14\n\x12_dataflow_graph_idB\x0c\n\n_flow_nameB\x16\n\x14_target_dataset_nameB\x0b\n\t_relation\x1a\x97\x02\n\x08StartRun\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12\x34\n\x16\x66ull_refresh_selection\x18\x02 \x03(\tR\x14\x66ullRefreshSelection\x12-\n\x10\x66ull_refresh_all\x18\x03 \x01(\x08H\x01R\x0e\x66ullRefreshAll\x88\x01\x01\x12+\n\x11refresh_selection\x18\x04 \x03(\tR\x10refreshSelection\x12\x15\n\x03\x64ry\x18\x05 \x01(\x08H\x02R\x03\x64ry\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\x13\n\x11_full_refresh_allB\x06\n\x04_dry\x1a\xc7\x01\n\x16\x44\x65\x66ineSqlGraphElements\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x12\'\n\rsql_file_path\x18\x02 \x01(\tH\x01R\x0bsqlFilePath\x88\x01\x01\x12\x1e\n\x08sql_text\x18\x03 \x01(\tH\x02R\x07sqlText\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\x10\n\x0e_sql_file_pathB\x0b\n\t_sql_textB\x0e\n\x0c\x63ommand_type"\x8e\x02\n\x15PipelineCommandResult\x12\x81\x01\n\x1c\x63reate_dataflow_graph_result\x18\x01 \x01(\x0b\x32>.spark.connect.PipelineCommandResult.CreateDataflowGraphResultH\x00R\x19\x63reateDataflowGraphResult\x1a\x62\n\x19\x43reateDataflowGraphResult\x12/\n\x11\x64\x61taflow_graph_id\x18\x01 \x01(\tH\x00R\x0f\x64\x61taflowGraphId\x88\x01\x01\x42\x14\n\x12_dataflow_graph_idB\r\n\x0bresult_type"I\n\x13PipelineEventResult\x12\x32\n\x05\x65vent\x18\x01 \x01(\x0b\x32\x1c.spark.connect.PipelineEventR\x05\x65vent"t\n\rPipelineEvent\x12\x38\n\ttimestamp\x18\x01 \x01(\x0b\x32\x1a.google.protobuf.TimestampR\ttimestamp\x12\x1d\n\x07message\x18\x02 \x01(\tH\x00R\x07message\x88\x01\x01\x42\n\n\x08_message*a\n\x0b\x44\x61tasetType\x12\x1c\n\x18\x44\x41TASET_TYPE_UNSPECIFIED\x10\x00\x12\x15\n\x11MATERIALIZED_VIEW\x10\x01\x12\t\n\x05TABLE\x10\x02\x12\x12\n\x0eTEMPORARY_VIEW\x10\x03\x42\x36\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
)
_globals = globals()
@@ -50,17 +50,19 @@
)
if not _descriptor._USE_C_DESCRIPTORS:
_globals["DESCRIPTOR"]._loaded_options = None
- _globals["DESCRIPTOR"]._serialized_options = b"\n\036org.apache.spark.connect.protoP\001"
+ _globals[
+ "DESCRIPTOR"
+ ]._serialized_options = b"\n\036org.apache.spark.connect.protoP\001Z\022internal/generated"
_globals["_PIPELINECOMMAND_CREATEDATAFLOWGRAPH_SQLCONFENTRY"]._loaded_options = None
_globals["_PIPELINECOMMAND_CREATEDATAFLOWGRAPH_SQLCONFENTRY"]._serialized_options = b"8\001"
_globals["_PIPELINECOMMAND_DEFINEDATASET_TABLEPROPERTIESENTRY"]._loaded_options = None
_globals["_PIPELINECOMMAND_DEFINEDATASET_TABLEPROPERTIESENTRY"]._serialized_options = b"8\001"
_globals["_PIPELINECOMMAND_DEFINEFLOW_SQLCONFENTRY"]._loaded_options = None
_globals["_PIPELINECOMMAND_DEFINEFLOW_SQLCONFENTRY"]._serialized_options = b"8\001"
- _globals["_DATASETTYPE"]._serialized_start = 3014
- _globals["_DATASETTYPE"]._serialized_end = 3111
+ _globals["_DATASETTYPE"]._serialized_start = 3191
+ _globals["_DATASETTYPE"]._serialized_end = 3288
_globals["_PIPELINECOMMAND"]._serialized_start = 140
- _globals["_PIPELINECOMMAND"]._serialized_end = 2546
+ _globals["_PIPELINECOMMAND"]._serialized_end = 2723
_globals["_PIPELINECOMMAND_CREATEDATAFLOWGRAPH"]._serialized_start = 719
_globals["_PIPELINECOMMAND_CREATEDATAFLOWGRAPH"]._serialized_end = 1110
_globals["_PIPELINECOMMAND_CREATEDATAFLOWGRAPH_SQLCONFENTRY"]._serialized_start = 928
@@ -74,19 +76,19 @@
_globals["_PIPELINECOMMAND_DEFINEDATASET_TABLEPROPERTIESENTRY"]._serialized_start = 1642
_globals["_PIPELINECOMMAND_DEFINEDATASET_TABLEPROPERTIESENTRY"]._serialized_end = 1708
_globals["_PIPELINECOMMAND_DEFINEFLOW"]._serialized_start = 1801
- _globals["_PIPELINECOMMAND_DEFINEFLOW"]._serialized_end = 2245
+ _globals["_PIPELINECOMMAND_DEFINEFLOW"]._serialized_end = 2223
_globals["_PIPELINECOMMAND_DEFINEFLOW_SQLCONFENTRY"]._serialized_start = 928
_globals["_PIPELINECOMMAND_DEFINEFLOW_SQLCONFENTRY"]._serialized_end = 986
- _globals["_PIPELINECOMMAND_STARTRUN"]._serialized_start = 2247
- _globals["_PIPELINECOMMAND_STARTRUN"]._serialized_end = 2328
- _globals["_PIPELINECOMMAND_DEFINESQLGRAPHELEMENTS"]._serialized_start = 2331
- _globals["_PIPELINECOMMAND_DEFINESQLGRAPHELEMENTS"]._serialized_end = 2530
- _globals["_PIPELINECOMMANDRESULT"]._serialized_start = 2549
- _globals["_PIPELINECOMMANDRESULT"]._serialized_end = 2819
- _globals["_PIPELINECOMMANDRESULT_CREATEDATAFLOWGRAPHRESULT"]._serialized_start = 2706
- _globals["_PIPELINECOMMANDRESULT_CREATEDATAFLOWGRAPHRESULT"]._serialized_end = 2804
- _globals["_PIPELINEEVENTRESULT"]._serialized_start = 2821
- _globals["_PIPELINEEVENTRESULT"]._serialized_end = 2894
- _globals["_PIPELINEEVENT"]._serialized_start = 2896
- _globals["_PIPELINEEVENT"]._serialized_end = 3012
+ _globals["_PIPELINECOMMAND_STARTRUN"]._serialized_start = 2226
+ _globals["_PIPELINECOMMAND_STARTRUN"]._serialized_end = 2505
+ _globals["_PIPELINECOMMAND_DEFINESQLGRAPHELEMENTS"]._serialized_start = 2508
+ _globals["_PIPELINECOMMAND_DEFINESQLGRAPHELEMENTS"]._serialized_end = 2707
+ _globals["_PIPELINECOMMANDRESULT"]._serialized_start = 2726
+ _globals["_PIPELINECOMMANDRESULT"]._serialized_end = 2996
+ _globals["_PIPELINECOMMANDRESULT_CREATEDATAFLOWGRAPHRESULT"]._serialized_start = 2883
+ _globals["_PIPELINECOMMANDRESULT_CREATEDATAFLOWGRAPHRESULT"]._serialized_end = 2981
+ _globals["_PIPELINEEVENTRESULT"]._serialized_start = 2998
+ _globals["_PIPELINEEVENTRESULT"]._serialized_end = 3071
+ _globals["_PIPELINEEVENT"]._serialized_start = 3073
+ _globals["_PIPELINEEVENT"]._serialized_end = 3189
# @@protoc_insertion_point(module_scope)
diff --git a/python/pyspark/sql/connect/proto/pipelines_pb2.pyi b/python/pyspark/sql/connect/proto/pipelines_pb2.pyi
index cf2cb8d3053b7..6287aabafc6b2 100644
--- a/python/pyspark/sql/connect/proto/pipelines_pb2.pyi
+++ b/python/pyspark/sql/connect/proto/pipelines_pb2.pyi
@@ -418,9 +418,8 @@ class PipelineCommand(google.protobuf.message.Message):
DATAFLOW_GRAPH_ID_FIELD_NUMBER: builtins.int
FLOW_NAME_FIELD_NUMBER: builtins.int
TARGET_DATASET_NAME_FIELD_NUMBER: builtins.int
- PLAN_FIELD_NUMBER: builtins.int
+ RELATION_FIELD_NUMBER: builtins.int
SQL_CONF_FIELD_NUMBER: builtins.int
- ONCE_FIELD_NUMBER: builtins.int
dataflow_graph_id: builtins.str
"""The graph to attach this flow to."""
flow_name: builtins.str
@@ -428,24 +427,21 @@ class PipelineCommand(google.protobuf.message.Message):
target_dataset_name: builtins.str
"""Name of the dataset this flow writes to. Can be partially or fully qualified."""
@property
- def plan(self) -> pyspark.sql.connect.proto.relations_pb2.Relation:
+ def relation(self) -> pyspark.sql.connect.proto.relations_pb2.Relation:
"""An unresolved relation that defines the dataset's flow."""
@property
def sql_conf(
self,
) -> google.protobuf.internal.containers.ScalarMap[builtins.str, builtins.str]:
"""SQL configurations set when running this flow."""
- once: builtins.bool
- """If true, this flow will only be run once per full refresh."""
def __init__(
self,
*,
dataflow_graph_id: builtins.str | None = ...,
flow_name: builtins.str | None = ...,
target_dataset_name: builtins.str | None = ...,
- plan: pyspark.sql.connect.proto.relations_pb2.Relation | None = ...,
+ relation: pyspark.sql.connect.proto.relations_pb2.Relation | None = ...,
sql_conf: collections.abc.Mapping[builtins.str, builtins.str] | None = ...,
- once: builtins.bool | None = ...,
) -> None: ...
def HasField(
self,
@@ -454,20 +450,16 @@ class PipelineCommand(google.protobuf.message.Message):
b"_dataflow_graph_id",
"_flow_name",
b"_flow_name",
- "_once",
- b"_once",
- "_plan",
- b"_plan",
+ "_relation",
+ b"_relation",
"_target_dataset_name",
b"_target_dataset_name",
"dataflow_graph_id",
b"dataflow_graph_id",
"flow_name",
b"flow_name",
- "once",
- b"once",
- "plan",
- b"plan",
+ "relation",
+ b"relation",
"target_dataset_name",
b"target_dataset_name",
],
@@ -479,20 +471,16 @@ class PipelineCommand(google.protobuf.message.Message):
b"_dataflow_graph_id",
"_flow_name",
b"_flow_name",
- "_once",
- b"_once",
- "_plan",
- b"_plan",
+ "_relation",
+ b"_relation",
"_target_dataset_name",
b"_target_dataset_name",
"dataflow_graph_id",
b"dataflow_graph_id",
"flow_name",
b"flow_name",
- "once",
- b"once",
- "plan",
- b"plan",
+ "relation",
+ b"relation",
"sql_conf",
b"sql_conf",
"target_dataset_name",
@@ -510,12 +498,8 @@ class PipelineCommand(google.protobuf.message.Message):
) -> typing_extensions.Literal["flow_name"] | None: ...
@typing.overload
def WhichOneof(
- self, oneof_group: typing_extensions.Literal["_once", b"_once"]
- ) -> typing_extensions.Literal["once"] | None: ...
- @typing.overload
- def WhichOneof(
- self, oneof_group: typing_extensions.Literal["_plan", b"_plan"]
- ) -> typing_extensions.Literal["plan"] | None: ...
+ self, oneof_group: typing_extensions.Literal["_relation", b"_relation"]
+ ) -> typing_extensions.Literal["relation"] | None: ...
@typing.overload
def WhichOneof(
self,
@@ -530,20 +514,52 @@ class PipelineCommand(google.protobuf.message.Message):
DESCRIPTOR: google.protobuf.descriptor.Descriptor
DATAFLOW_GRAPH_ID_FIELD_NUMBER: builtins.int
+ FULL_REFRESH_SELECTION_FIELD_NUMBER: builtins.int
+ FULL_REFRESH_ALL_FIELD_NUMBER: builtins.int
+ REFRESH_SELECTION_FIELD_NUMBER: builtins.int
+ DRY_FIELD_NUMBER: builtins.int
dataflow_graph_id: builtins.str
"""The graph to start."""
+ @property
+ def full_refresh_selection(
+ self,
+ ) -> google.protobuf.internal.containers.RepeatedScalarFieldContainer[builtins.str]:
+ """List of dataset to reset and recompute."""
+ full_refresh_all: builtins.bool
+ """Perform a full graph reset and recompute."""
+ @property
+ def refresh_selection(
+ self,
+ ) -> google.protobuf.internal.containers.RepeatedScalarFieldContainer[builtins.str]:
+ """List of dataset to update."""
+ dry: builtins.bool
+ """If true, the run will not actually execute any flows, but will only validate the graph and
+ check for any errors. This is useful for testing and validation purposes.
+ """
def __init__(
self,
*,
dataflow_graph_id: builtins.str | None = ...,
+ full_refresh_selection: collections.abc.Iterable[builtins.str] | None = ...,
+ full_refresh_all: builtins.bool | None = ...,
+ refresh_selection: collections.abc.Iterable[builtins.str] | None = ...,
+ dry: builtins.bool | None = ...,
) -> None: ...
def HasField(
self,
field_name: typing_extensions.Literal[
"_dataflow_graph_id",
b"_dataflow_graph_id",
+ "_dry",
+ b"_dry",
+ "_full_refresh_all",
+ b"_full_refresh_all",
"dataflow_graph_id",
b"dataflow_graph_id",
+ "dry",
+ b"dry",
+ "full_refresh_all",
+ b"full_refresh_all",
],
) -> builtins.bool: ...
def ClearField(
@@ -551,14 +567,35 @@ class PipelineCommand(google.protobuf.message.Message):
field_name: typing_extensions.Literal[
"_dataflow_graph_id",
b"_dataflow_graph_id",
+ "_dry",
+ b"_dry",
+ "_full_refresh_all",
+ b"_full_refresh_all",
"dataflow_graph_id",
b"dataflow_graph_id",
+ "dry",
+ b"dry",
+ "full_refresh_all",
+ b"full_refresh_all",
+ "full_refresh_selection",
+ b"full_refresh_selection",
+ "refresh_selection",
+ b"refresh_selection",
],
) -> None: ...
+ @typing.overload
def WhichOneof(
self,
oneof_group: typing_extensions.Literal["_dataflow_graph_id", b"_dataflow_graph_id"],
) -> typing_extensions.Literal["dataflow_graph_id"] | None: ...
+ @typing.overload
+ def WhichOneof(
+ self, oneof_group: typing_extensions.Literal["_dry", b"_dry"]
+ ) -> typing_extensions.Literal["dry"] | None: ...
+ @typing.overload
+ def WhichOneof(
+ self, oneof_group: typing_extensions.Literal["_full_refresh_all", b"_full_refresh_all"]
+ ) -> typing_extensions.Literal["full_refresh_all"] | None: ...
class DefineSqlGraphElements(google.protobuf.message.Message):
"""Parses the SQL file and registers all datasets and flows."""
diff --git a/python/pyspark/sql/connect/proto/relations_pb2.py b/python/pyspark/sql/connect/proto/relations_pb2.py
index 525ba88ff67c6..3774bcbdbfb0e 100644
--- a/python/pyspark/sql/connect/proto/relations_pb2.py
+++ b/python/pyspark/sql/connect/proto/relations_pb2.py
@@ -43,7 +43,7 @@
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(
- b'\n\x1dspark/connect/relations.proto\x12\rspark.connect\x1a\x19google/protobuf/any.proto\x1a\x1fspark/connect/expressions.proto\x1a\x19spark/connect/types.proto\x1a\x1bspark/connect/catalog.proto\x1a\x1aspark/connect/common.proto\x1a\x1dspark/connect/ml_common.proto"\x9c\x1d\n\x08Relation\x12\x35\n\x06\x63ommon\x18\x01 \x01(\x0b\x32\x1d.spark.connect.RelationCommonR\x06\x63ommon\x12)\n\x04read\x18\x02 \x01(\x0b\x32\x13.spark.connect.ReadH\x00R\x04read\x12\x32\n\x07project\x18\x03 \x01(\x0b\x32\x16.spark.connect.ProjectH\x00R\x07project\x12/\n\x06\x66ilter\x18\x04 \x01(\x0b\x32\x15.spark.connect.FilterH\x00R\x06\x66ilter\x12)\n\x04join\x18\x05 \x01(\x0b\x32\x13.spark.connect.JoinH\x00R\x04join\x12\x34\n\x06set_op\x18\x06 \x01(\x0b\x32\x1b.spark.connect.SetOperationH\x00R\x05setOp\x12)\n\x04sort\x18\x07 \x01(\x0b\x32\x13.spark.connect.SortH\x00R\x04sort\x12,\n\x05limit\x18\x08 \x01(\x0b\x32\x14.spark.connect.LimitH\x00R\x05limit\x12\x38\n\taggregate\x18\t \x01(\x0b\x32\x18.spark.connect.AggregateH\x00R\taggregate\x12&\n\x03sql\x18\n \x01(\x0b\x32\x12.spark.connect.SQLH\x00R\x03sql\x12\x45\n\x0elocal_relation\x18\x0b \x01(\x0b\x32\x1c.spark.connect.LocalRelationH\x00R\rlocalRelation\x12/\n\x06sample\x18\x0c \x01(\x0b\x32\x15.spark.connect.SampleH\x00R\x06sample\x12/\n\x06offset\x18\r \x01(\x0b\x32\x15.spark.connect.OffsetH\x00R\x06offset\x12>\n\x0b\x64\x65\x64uplicate\x18\x0e \x01(\x0b\x32\x1a.spark.connect.DeduplicateH\x00R\x0b\x64\x65\x64uplicate\x12,\n\x05range\x18\x0f \x01(\x0b\x32\x14.spark.connect.RangeH\x00R\x05range\x12\x45\n\x0esubquery_alias\x18\x10 \x01(\x0b\x32\x1c.spark.connect.SubqueryAliasH\x00R\rsubqueryAlias\x12>\n\x0brepartition\x18\x11 \x01(\x0b\x32\x1a.spark.connect.RepartitionH\x00R\x0brepartition\x12*\n\x05to_df\x18\x12 \x01(\x0b\x32\x13.spark.connect.ToDFH\x00R\x04toDf\x12U\n\x14with_columns_renamed\x18\x13 \x01(\x0b\x32!.spark.connect.WithColumnsRenamedH\x00R\x12withColumnsRenamed\x12<\n\x0bshow_string\x18\x14 \x01(\x0b\x32\x19.spark.connect.ShowStringH\x00R\nshowString\x12)\n\x04\x64rop\x18\x15 \x01(\x0b\x32\x13.spark.connect.DropH\x00R\x04\x64rop\x12)\n\x04tail\x18\x16 \x01(\x0b\x32\x13.spark.connect.TailH\x00R\x04tail\x12?\n\x0cwith_columns\x18\x17 \x01(\x0b\x32\x1a.spark.connect.WithColumnsH\x00R\x0bwithColumns\x12)\n\x04hint\x18\x18 \x01(\x0b\x32\x13.spark.connect.HintH\x00R\x04hint\x12\x32\n\x07unpivot\x18\x19 \x01(\x0b\x32\x16.spark.connect.UnpivotH\x00R\x07unpivot\x12\x36\n\tto_schema\x18\x1a \x01(\x0b\x32\x17.spark.connect.ToSchemaH\x00R\x08toSchema\x12\x64\n\x19repartition_by_expression\x18\x1b \x01(\x0b\x32&.spark.connect.RepartitionByExpressionH\x00R\x17repartitionByExpression\x12\x45\n\x0emap_partitions\x18\x1c \x01(\x0b\x32\x1c.spark.connect.MapPartitionsH\x00R\rmapPartitions\x12H\n\x0f\x63ollect_metrics\x18\x1d \x01(\x0b\x32\x1d.spark.connect.CollectMetricsH\x00R\x0e\x63ollectMetrics\x12,\n\x05parse\x18\x1e \x01(\x0b\x32\x14.spark.connect.ParseH\x00R\x05parse\x12\x36\n\tgroup_map\x18\x1f \x01(\x0b\x32\x17.spark.connect.GroupMapH\x00R\x08groupMap\x12=\n\x0c\x63o_group_map\x18 \x01(\x0b\x32\x19.spark.connect.CoGroupMapH\x00R\ncoGroupMap\x12\x45\n\x0ewith_watermark\x18! 
\x01(\x0b\x32\x1c.spark.connect.WithWatermarkH\x00R\rwithWatermark\x12\x63\n\x1a\x61pply_in_pandas_with_state\x18" \x01(\x0b\x32%.spark.connect.ApplyInPandasWithStateH\x00R\x16\x61pplyInPandasWithState\x12<\n\x0bhtml_string\x18# \x01(\x0b\x32\x19.spark.connect.HtmlStringH\x00R\nhtmlString\x12X\n\x15\x63\x61\x63hed_local_relation\x18$ \x01(\x0b\x32".spark.connect.CachedLocalRelationH\x00R\x13\x63\x61\x63hedLocalRelation\x12[\n\x16\x63\x61\x63hed_remote_relation\x18% \x01(\x0b\x32#.spark.connect.CachedRemoteRelationH\x00R\x14\x63\x61\x63hedRemoteRelation\x12\x8e\x01\n)common_inline_user_defined_table_function\x18& \x01(\x0b\x32\x33.spark.connect.CommonInlineUserDefinedTableFunctionH\x00R$commonInlineUserDefinedTableFunction\x12\x37\n\nas_of_join\x18\' \x01(\x0b\x32\x17.spark.connect.AsOfJoinH\x00R\x08\x61sOfJoin\x12\x85\x01\n&common_inline_user_defined_data_source\x18( \x01(\x0b\x32\x30.spark.connect.CommonInlineUserDefinedDataSourceH\x00R!commonInlineUserDefinedDataSource\x12\x45\n\x0ewith_relations\x18) \x01(\x0b\x32\x1c.spark.connect.WithRelationsH\x00R\rwithRelations\x12\x38\n\ttranspose\x18* \x01(\x0b\x32\x18.spark.connect.TransposeH\x00R\ttranspose\x12w\n unresolved_table_valued_function\x18+ \x01(\x0b\x32,.spark.connect.UnresolvedTableValuedFunctionH\x00R\x1dunresolvedTableValuedFunction\x12?\n\x0clateral_join\x18, \x01(\x0b\x32\x1a.spark.connect.LateralJoinH\x00R\x0blateralJoin\x12\x30\n\x07\x66ill_na\x18Z \x01(\x0b\x32\x15.spark.connect.NAFillH\x00R\x06\x66illNa\x12\x30\n\x07\x64rop_na\x18[ \x01(\x0b\x32\x15.spark.connect.NADropH\x00R\x06\x64ropNa\x12\x34\n\x07replace\x18\\ \x01(\x0b\x32\x18.spark.connect.NAReplaceH\x00R\x07replace\x12\x36\n\x07summary\x18\x64 \x01(\x0b\x32\x1a.spark.connect.StatSummaryH\x00R\x07summary\x12\x39\n\x08\x63rosstab\x18\x65 \x01(\x0b\x32\x1b.spark.connect.StatCrosstabH\x00R\x08\x63rosstab\x12\x39\n\x08\x64\x65scribe\x18\x66 \x01(\x0b\x32\x1b.spark.connect.StatDescribeH\x00R\x08\x64\x65scribe\x12*\n\x03\x63ov\x18g \x01(\x0b\x32\x16.spark.connect.StatCovH\x00R\x03\x63ov\x12-\n\x04\x63orr\x18h \x01(\x0b\x32\x17.spark.connect.StatCorrH\x00R\x04\x63orr\x12L\n\x0f\x61pprox_quantile\x18i \x01(\x0b\x32!.spark.connect.StatApproxQuantileH\x00R\x0e\x61pproxQuantile\x12=\n\nfreq_items\x18j \x01(\x0b\x32\x1c.spark.connect.StatFreqItemsH\x00R\tfreqItems\x12:\n\tsample_by\x18k \x01(\x0b\x32\x1b.spark.connect.StatSampleByH\x00R\x08sampleBy\x12\x33\n\x07\x63\x61talog\x18\xc8\x01 \x01(\x0b\x32\x16.spark.connect.CatalogH\x00R\x07\x63\x61talog\x12=\n\x0bml_relation\x18\xac\x02 \x01(\x0b\x32\x19.spark.connect.MlRelationH\x00R\nmlRelation\x12\x35\n\textension\x18\xe6\x07 \x01(\x0b\x32\x14.google.protobuf.AnyH\x00R\textension\x12\x33\n\x07unknown\x18\xe7\x07 \x01(\x0b\x32\x16.spark.connect.UnknownH\x00R\x07unknownB\n\n\x08rel_type"\xf8\x02\n\nMlRelation\x12\x43\n\ttransform\x18\x01 \x01(\x0b\x32#.spark.connect.MlRelation.TransformH\x00R\ttransform\x12,\n\x05\x66\x65tch\x18\x02 \x01(\x0b\x32\x14.spark.connect.FetchH\x00R\x05\x66\x65tch\x1a\xeb\x01\n\tTransform\x12\x33\n\x07obj_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefH\x00R\x06objRef\x12=\n\x0btransformer\x18\x02 \x01(\x0b\x32\x19.spark.connect.MlOperatorH\x00R\x0btransformer\x12-\n\x05input\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12/\n\x06params\x18\x04 \x01(\x0b\x32\x17.spark.connect.MlParamsR\x06paramsB\n\n\x08operatorB\t\n\x07ml_type"\xcb\x02\n\x05\x46\x65tch\x12\x31\n\x07obj_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefR\x06objRef\x12\x35\n\x07methods\x18\x02 
\x03(\x0b\x32\x1b.spark.connect.Fetch.MethodR\x07methods\x1a\xd7\x01\n\x06Method\x12\x16\n\x06method\x18\x01 \x01(\tR\x06method\x12\x34\n\x04\x61rgs\x18\x02 \x03(\x0b\x32 .spark.connect.Fetch.Method.ArgsR\x04\x61rgs\x1a\x7f\n\x04\x41rgs\x12\x39\n\x05param\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralH\x00R\x05param\x12/\n\x05input\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationH\x00R\x05inputB\x0b\n\targs_type"\t\n\x07Unknown"\x8e\x01\n\x0eRelationCommon\x12#\n\x0bsource_info\x18\x01 \x01(\tB\x02\x18\x01R\nsourceInfo\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x00R\x06planId\x88\x01\x01\x12-\n\x06origin\x18\x03 \x01(\x0b\x32\x15.spark.connect.OriginR\x06originB\n\n\x08_plan_id"\xde\x03\n\x03SQL\x12\x14\n\x05query\x18\x01 \x01(\tR\x05query\x12\x34\n\x04\x61rgs\x18\x02 \x03(\x0b\x32\x1c.spark.connect.SQL.ArgsEntryB\x02\x18\x01R\x04\x61rgs\x12@\n\x08pos_args\x18\x03 \x03(\x0b\x32!.spark.connect.Expression.LiteralB\x02\x18\x01R\x07posArgs\x12O\n\x0fnamed_arguments\x18\x04 \x03(\x0b\x32&.spark.connect.SQL.NamedArgumentsEntryR\x0enamedArguments\x12>\n\rpos_arguments\x18\x05 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0cposArguments\x1aZ\n\tArgsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x37\n\x05value\x18\x02 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x05value:\x02\x38\x01\x1a\\\n\x13NamedArgumentsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12/\n\x05value\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05value:\x02\x38\x01"u\n\rWithRelations\x12+\n\x04root\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04root\x12\x37\n\nreferences\x18\x02 \x03(\x0b\x32\x17.spark.connect.RelationR\nreferences"\x97\x05\n\x04Read\x12\x41\n\x0bnamed_table\x18\x01 \x01(\x0b\x32\x1e.spark.connect.Read.NamedTableH\x00R\nnamedTable\x12\x41\n\x0b\x64\x61ta_source\x18\x02 \x01(\x0b\x32\x1e.spark.connect.Read.DataSourceH\x00R\ndataSource\x12!\n\x0cis_streaming\x18\x03 \x01(\x08R\x0bisStreaming\x1a\xc0\x01\n\nNamedTable\x12/\n\x13unparsed_identifier\x18\x01 \x01(\tR\x12unparsedIdentifier\x12\x45\n\x07options\x18\x02 \x03(\x0b\x32+.spark.connect.Read.NamedTable.OptionsEntryR\x07options\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x1a\x95\x02\n\nDataSource\x12\x1b\n\x06\x66ormat\x18\x01 \x01(\tH\x00R\x06\x66ormat\x88\x01\x01\x12\x1b\n\x06schema\x18\x02 \x01(\tH\x01R\x06schema\x88\x01\x01\x12\x45\n\x07options\x18\x03 \x03(\x0b\x32+.spark.connect.Read.DataSource.OptionsEntryR\x07options\x12\x14\n\x05paths\x18\x04 \x03(\tR\x05paths\x12\x1e\n\npredicates\x18\x05 \x03(\tR\npredicates\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x42\t\n\x07_formatB\t\n\x07_schemaB\x0b\n\tread_type"u\n\x07Project\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12;\n\x0b\x65xpressions\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0b\x65xpressions"p\n\x06\x46ilter\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x37\n\tcondition\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\tcondition"\x95\x05\n\x04Join\x12+\n\x04left\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04left\x12-\n\x05right\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\x05right\x12@\n\x0ejoin_condition\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\rjoinCondition\x12\x39\n\tjoin_type\x18\x04 \x01(\x0e\x32\x1c.spark.connect.Join.JoinTypeR\x08joinType\x12#\n\rusing_columns\x18\x05 
\x03(\tR\x0cusingColumns\x12K\n\x0ejoin_data_type\x18\x06 \x01(\x0b\x32 .spark.connect.Join.JoinDataTypeH\x00R\x0cjoinDataType\x88\x01\x01\x1a\\\n\x0cJoinDataType\x12$\n\x0eis_left_struct\x18\x01 \x01(\x08R\x0cisLeftStruct\x12&\n\x0fis_right_struct\x18\x02 \x01(\x08R\risRightStruct"\xd0\x01\n\x08JoinType\x12\x19\n\x15JOIN_TYPE_UNSPECIFIED\x10\x00\x12\x13\n\x0fJOIN_TYPE_INNER\x10\x01\x12\x18\n\x14JOIN_TYPE_FULL_OUTER\x10\x02\x12\x18\n\x14JOIN_TYPE_LEFT_OUTER\x10\x03\x12\x19\n\x15JOIN_TYPE_RIGHT_OUTER\x10\x04\x12\x17\n\x13JOIN_TYPE_LEFT_ANTI\x10\x05\x12\x17\n\x13JOIN_TYPE_LEFT_SEMI\x10\x06\x12\x13\n\x0fJOIN_TYPE_CROSS\x10\x07\x42\x11\n\x0f_join_data_type"\xdf\x03\n\x0cSetOperation\x12\x36\n\nleft_input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\tleftInput\x12\x38\n\x0bright_input\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\nrightInput\x12\x45\n\x0bset_op_type\x18\x03 \x01(\x0e\x32%.spark.connect.SetOperation.SetOpTypeR\tsetOpType\x12\x1a\n\x06is_all\x18\x04 \x01(\x08H\x00R\x05isAll\x88\x01\x01\x12\x1c\n\x07\x62y_name\x18\x05 \x01(\x08H\x01R\x06\x62yName\x88\x01\x01\x12\x37\n\x15\x61llow_missing_columns\x18\x06 \x01(\x08H\x02R\x13\x61llowMissingColumns\x88\x01\x01"r\n\tSetOpType\x12\x1b\n\x17SET_OP_TYPE_UNSPECIFIED\x10\x00\x12\x19\n\x15SET_OP_TYPE_INTERSECT\x10\x01\x12\x15\n\x11SET_OP_TYPE_UNION\x10\x02\x12\x16\n\x12SET_OP_TYPE_EXCEPT\x10\x03\x42\t\n\x07_is_allB\n\n\x08_by_nameB\x18\n\x16_allow_missing_columns"L\n\x05Limit\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x14\n\x05limit\x18\x02 \x01(\x05R\x05limit"O\n\x06Offset\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x16\n\x06offset\x18\x02 \x01(\x05R\x06offset"K\n\x04Tail\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x14\n\x05limit\x18\x02 \x01(\x05R\x05limit"\xfe\x05\n\tAggregate\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x41\n\ngroup_type\x18\x02 \x01(\x0e\x32".spark.connect.Aggregate.GroupTypeR\tgroupType\x12L\n\x14grouping_expressions\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x13groupingExpressions\x12N\n\x15\x61ggregate_expressions\x18\x04 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x14\x61ggregateExpressions\x12\x34\n\x05pivot\x18\x05 \x01(\x0b\x32\x1e.spark.connect.Aggregate.PivotR\x05pivot\x12J\n\rgrouping_sets\x18\x06 \x03(\x0b\x32%.spark.connect.Aggregate.GroupingSetsR\x0cgroupingSets\x1ao\n\x05Pivot\x12+\n\x03\x63ol\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x03\x63ol\x12\x39\n\x06values\x18\x02 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x06values\x1aL\n\x0cGroupingSets\x12<\n\x0cgrouping_set\x18\x01 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0bgroupingSet"\x9f\x01\n\tGroupType\x12\x1a\n\x16GROUP_TYPE_UNSPECIFIED\x10\x00\x12\x16\n\x12GROUP_TYPE_GROUPBY\x10\x01\x12\x15\n\x11GROUP_TYPE_ROLLUP\x10\x02\x12\x13\n\x0fGROUP_TYPE_CUBE\x10\x03\x12\x14\n\x10GROUP_TYPE_PIVOT\x10\x04\x12\x1c\n\x18GROUP_TYPE_GROUPING_SETS\x10\x05"\xa0\x01\n\x04Sort\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x39\n\x05order\x18\x02 \x03(\x0b\x32#.spark.connect.Expression.SortOrderR\x05order\x12 \n\tis_global\x18\x03 \x01(\x08H\x00R\x08isGlobal\x88\x01\x01\x42\x0c\n\n_is_global"\x8d\x01\n\x04\x44rop\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x33\n\x07\x63olumns\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x07\x63olumns\x12!\n\x0c\x63olumn_names\x18\x03 
\x03(\tR\x0b\x63olumnNames"\xf0\x01\n\x0b\x44\x65\x64uplicate\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12!\n\x0c\x63olumn_names\x18\x02 \x03(\tR\x0b\x63olumnNames\x12\x32\n\x13\x61ll_columns_as_keys\x18\x03 \x01(\x08H\x00R\x10\x61llColumnsAsKeys\x88\x01\x01\x12.\n\x10within_watermark\x18\x04 \x01(\x08H\x01R\x0fwithinWatermark\x88\x01\x01\x42\x16\n\x14_all_columns_as_keysB\x13\n\x11_within_watermark"Y\n\rLocalRelation\x12\x17\n\x04\x64\x61ta\x18\x01 \x01(\x0cH\x00R\x04\x64\x61ta\x88\x01\x01\x12\x1b\n\x06schema\x18\x02 \x01(\tH\x01R\x06schema\x88\x01\x01\x42\x07\n\x05_dataB\t\n\x07_schema"H\n\x13\x43\x61\x63hedLocalRelation\x12\x12\n\x04hash\x18\x03 \x01(\tR\x04hashJ\x04\x08\x01\x10\x02J\x04\x08\x02\x10\x03R\x06userIdR\tsessionId"7\n\x14\x43\x61\x63hedRemoteRelation\x12\x1f\n\x0brelation_id\x18\x01 \x01(\tR\nrelationId"\x91\x02\n\x06Sample\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x1f\n\x0blower_bound\x18\x02 \x01(\x01R\nlowerBound\x12\x1f\n\x0bupper_bound\x18\x03 \x01(\x01R\nupperBound\x12.\n\x10with_replacement\x18\x04 \x01(\x08H\x00R\x0fwithReplacement\x88\x01\x01\x12\x17\n\x04seed\x18\x05 \x01(\x03H\x01R\x04seed\x88\x01\x01\x12/\n\x13\x64\x65terministic_order\x18\x06 \x01(\x08R\x12\x64\x65terministicOrderB\x13\n\x11_with_replacementB\x07\n\x05_seed"\x91\x01\n\x05Range\x12\x19\n\x05start\x18\x01 \x01(\x03H\x00R\x05start\x88\x01\x01\x12\x10\n\x03\x65nd\x18\x02 \x01(\x03R\x03\x65nd\x12\x12\n\x04step\x18\x03 \x01(\x03R\x04step\x12*\n\x0enum_partitions\x18\x04 \x01(\x05H\x01R\rnumPartitions\x88\x01\x01\x42\x08\n\x06_startB\x11\n\x0f_num_partitions"r\n\rSubqueryAlias\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x14\n\x05\x61lias\x18\x02 \x01(\tR\x05\x61lias\x12\x1c\n\tqualifier\x18\x03 \x03(\tR\tqualifier"\x8e\x01\n\x0bRepartition\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12%\n\x0enum_partitions\x18\x02 \x01(\x05R\rnumPartitions\x12\x1d\n\x07shuffle\x18\x03 \x01(\x08H\x00R\x07shuffle\x88\x01\x01\x42\n\n\x08_shuffle"\x8e\x01\n\nShowString\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x19\n\x08num_rows\x18\x02 \x01(\x05R\x07numRows\x12\x1a\n\x08truncate\x18\x03 \x01(\x05R\x08truncate\x12\x1a\n\x08vertical\x18\x04 \x01(\x08R\x08vertical"r\n\nHtmlString\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x19\n\x08num_rows\x18\x02 \x01(\x05R\x07numRows\x12\x1a\n\x08truncate\x18\x03 \x01(\x05R\x08truncate"\\\n\x0bStatSummary\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x1e\n\nstatistics\x18\x02 \x03(\tR\nstatistics"Q\n\x0cStatDescribe\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols"e\n\x0cStatCrosstab\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ol1\x18\x02 \x01(\tR\x04\x63ol1\x12\x12\n\x04\x63ol2\x18\x03 \x01(\tR\x04\x63ol2"`\n\x07StatCov\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ol1\x18\x02 \x01(\tR\x04\x63ol1\x12\x12\n\x04\x63ol2\x18\x03 \x01(\tR\x04\x63ol2"\x89\x01\n\x08StatCorr\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ol1\x18\x02 \x01(\tR\x04\x63ol1\x12\x12\n\x04\x63ol2\x18\x03 \x01(\tR\x04\x63ol2\x12\x1b\n\x06method\x18\x04 \x01(\tH\x00R\x06method\x88\x01\x01\x42\t\n\x07_method"\xa4\x01\n\x12StatApproxQuantile\x12-\n\x05input\x18\x01 
\x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12$\n\rprobabilities\x18\x03 \x03(\x01R\rprobabilities\x12%\n\x0erelative_error\x18\x04 \x01(\x01R\rrelativeError"}\n\rStatFreqItems\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12\x1d\n\x07support\x18\x03 \x01(\x01H\x00R\x07support\x88\x01\x01\x42\n\n\x08_support"\xb5\x02\n\x0cStatSampleBy\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12+\n\x03\x63ol\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x03\x63ol\x12\x42\n\tfractions\x18\x03 \x03(\x0b\x32$.spark.connect.StatSampleBy.FractionR\tfractions\x12\x17\n\x04seed\x18\x05 \x01(\x03H\x00R\x04seed\x88\x01\x01\x1a\x63\n\x08\x46raction\x12;\n\x07stratum\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x07stratum\x12\x1a\n\x08\x66raction\x18\x02 \x01(\x01R\x08\x66ractionB\x07\n\x05_seed"\x86\x01\n\x06NAFill\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12\x39\n\x06values\x18\x03 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x06values"\x86\x01\n\x06NADrop\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12\'\n\rmin_non_nulls\x18\x03 \x01(\x05H\x00R\x0bminNonNulls\x88\x01\x01\x42\x10\n\x0e_min_non_nulls"\xa8\x02\n\tNAReplace\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12H\n\x0creplacements\x18\x03 \x03(\x0b\x32$.spark.connect.NAReplace.ReplacementR\x0creplacements\x1a\x8d\x01\n\x0bReplacement\x12>\n\told_value\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x08oldValue\x12>\n\tnew_value\x18\x02 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x08newValue"X\n\x04ToDF\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12!\n\x0c\x63olumn_names\x18\x02 \x03(\tR\x0b\x63olumnNames"\xfe\x02\n\x12WithColumnsRenamed\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12i\n\x12rename_columns_map\x18\x02 \x03(\x0b\x32\x37.spark.connect.WithColumnsRenamed.RenameColumnsMapEntryB\x02\x18\x01R\x10renameColumnsMap\x12\x42\n\x07renames\x18\x03 \x03(\x0b\x32(.spark.connect.WithColumnsRenamed.RenameR\x07renames\x1a\x43\n\x15RenameColumnsMapEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x1a\x45\n\x06Rename\x12\x19\n\x08\x63ol_name\x18\x01 \x01(\tR\x07\x63olName\x12 \n\x0cnew_col_name\x18\x02 \x01(\tR\nnewColName"w\n\x0bWithColumns\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x39\n\x07\x61liases\x18\x02 \x03(\x0b\x32\x1f.spark.connect.Expression.AliasR\x07\x61liases"\x86\x01\n\rWithWatermark\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x1d\n\nevent_time\x18\x02 \x01(\tR\teventTime\x12\'\n\x0f\x64\x65lay_threshold\x18\x03 \x01(\tR\x0e\x64\x65layThreshold"\x84\x01\n\x04Hint\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04name\x18\x02 \x01(\tR\x04name\x12\x39\n\nparameters\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\nparameters"\xc7\x02\n\x07Unpivot\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12+\n\x03ids\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x03ids\x12:\n\x06values\x18\x03 
\x01(\x0b\x32\x1d.spark.connect.Unpivot.ValuesH\x00R\x06values\x88\x01\x01\x12\x30\n\x14variable_column_name\x18\x04 \x01(\tR\x12variableColumnName\x12*\n\x11value_column_name\x18\x05 \x01(\tR\x0fvalueColumnName\x1a;\n\x06Values\x12\x31\n\x06values\x18\x01 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x06valuesB\t\n\x07_values"z\n\tTranspose\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12>\n\rindex_columns\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0cindexColumns"}\n\x1dUnresolvedTableValuedFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12\x37\n\targuments\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments"j\n\x08ToSchema\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12/\n\x06schema\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x06schema"\xcb\x01\n\x17RepartitionByExpression\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x42\n\x0fpartition_exprs\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0epartitionExprs\x12*\n\x0enum_partitions\x18\x03 \x01(\x05H\x00R\rnumPartitions\x88\x01\x01\x42\x11\n\x0f_num_partitions"\xe8\x01\n\rMapPartitions\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x42\n\x04\x66unc\x18\x02 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12"\n\nis_barrier\x18\x03 \x01(\x08H\x00R\tisBarrier\x88\x01\x01\x12"\n\nprofile_id\x18\x04 \x01(\x05H\x01R\tprofileId\x88\x01\x01\x42\r\n\x0b_is_barrierB\r\n\x0b_profile_id"\xd2\x06\n\x08GroupMap\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12L\n\x14grouping_expressions\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x13groupingExpressions\x12\x42\n\x04\x66unc\x18\x03 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12J\n\x13sorting_expressions\x18\x04 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x12sortingExpressions\x12<\n\rinitial_input\x18\x05 \x01(\x0b\x32\x17.spark.connect.RelationR\x0cinitialInput\x12[\n\x1cinitial_grouping_expressions\x18\x06 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x1ainitialGroupingExpressions\x12;\n\x18is_map_groups_with_state\x18\x07 \x01(\x08H\x00R\x14isMapGroupsWithState\x88\x01\x01\x12$\n\x0boutput_mode\x18\x08 \x01(\tH\x01R\noutputMode\x88\x01\x01\x12&\n\x0ctimeout_conf\x18\t \x01(\tH\x02R\x0btimeoutConf\x88\x01\x01\x12?\n\x0cstate_schema\x18\n \x01(\x0b\x32\x17.spark.connect.DataTypeH\x03R\x0bstateSchema\x88\x01\x01\x12\x65\n\x19transform_with_state_info\x18\x0b \x01(\x0b\x32%.spark.connect.TransformWithStateInfoH\x04R\x16transformWithStateInfo\x88\x01\x01\x42\x1b\n\x19_is_map_groups_with_stateB\x0e\n\x0c_output_modeB\x0f\n\r_timeout_confB\x0f\n\r_state_schemaB\x1c\n\x1a_transform_with_state_info"\xdf\x01\n\x16TransformWithStateInfo\x12\x1b\n\ttime_mode\x18\x01 \x01(\tR\x08timeMode\x12\x38\n\x16\x65vent_time_column_name\x18\x02 \x01(\tH\x00R\x13\x65ventTimeColumnName\x88\x01\x01\x12\x41\n\routput_schema\x18\x03 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x01R\x0coutputSchema\x88\x01\x01\x42\x19\n\x17_event_time_column_nameB\x10\n\x0e_output_schema"\x8e\x04\n\nCoGroupMap\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12W\n\x1ainput_grouping_expressions\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x18inputGroupingExpressions\x12-\n\x05other\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x05other\x12W\n\x1aother_grouping_expressions\x18\x04 
\x03(\x0b\x32\x19.spark.connect.ExpressionR\x18otherGroupingExpressions\x12\x42\n\x04\x66unc\x18\x05 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12U\n\x19input_sorting_expressions\x18\x06 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x17inputSortingExpressions\x12U\n\x19other_sorting_expressions\x18\x07 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x17otherSortingExpressions"\xe5\x02\n\x16\x41pplyInPandasWithState\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12L\n\x14grouping_expressions\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x13groupingExpressions\x12\x42\n\x04\x66unc\x18\x03 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12#\n\routput_schema\x18\x04 \x01(\tR\x0coutputSchema\x12!\n\x0cstate_schema\x18\x05 \x01(\tR\x0bstateSchema\x12\x1f\n\x0boutput_mode\x18\x06 \x01(\tR\noutputMode\x12!\n\x0ctimeout_conf\x18\x07 \x01(\tR\x0btimeoutConf"\xf4\x01\n$CommonInlineUserDefinedTableFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12$\n\rdeterministic\x18\x02 \x01(\x08R\rdeterministic\x12\x37\n\targuments\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments\x12<\n\x0bpython_udtf\x18\x04 \x01(\x0b\x32\x19.spark.connect.PythonUDTFH\x00R\npythonUdtfB\n\n\x08\x66unction"\xb1\x01\n\nPythonUDTF\x12=\n\x0breturn_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\nreturnType\x88\x01\x01\x12\x1b\n\teval_type\x18\x02 \x01(\x05R\x08\x65valType\x12\x18\n\x07\x63ommand\x18\x03 \x01(\x0cR\x07\x63ommand\x12\x1d\n\npython_ver\x18\x04 \x01(\tR\tpythonVerB\x0e\n\x0c_return_type"\x97\x01\n!CommonInlineUserDefinedDataSource\x12\x12\n\x04name\x18\x01 \x01(\tR\x04name\x12O\n\x12python_data_source\x18\x02 \x01(\x0b\x32\x1f.spark.connect.PythonDataSourceH\x00R\x10pythonDataSourceB\r\n\x0b\x64\x61ta_source"K\n\x10PythonDataSource\x12\x18\n\x07\x63ommand\x18\x01 \x01(\x0cR\x07\x63ommand\x12\x1d\n\npython_ver\x18\x02 \x01(\tR\tpythonVer"\x88\x01\n\x0e\x43ollectMetrics\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04name\x18\x02 \x01(\tR\x04name\x12\x33\n\x07metrics\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x07metrics"\x84\x03\n\x05Parse\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x38\n\x06\x66ormat\x18\x02 \x01(\x0e\x32 .spark.connect.Parse.ParseFormatR\x06\x66ormat\x12\x34\n\x06schema\x18\x03 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\x06schema\x88\x01\x01\x12;\n\x07options\x18\x04 \x03(\x0b\x32!.spark.connect.Parse.OptionsEntryR\x07options\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01"X\n\x0bParseFormat\x12\x1c\n\x18PARSE_FORMAT_UNSPECIFIED\x10\x00\x12\x14\n\x10PARSE_FORMAT_CSV\x10\x01\x12\x15\n\x11PARSE_FORMAT_JSON\x10\x02\x42\t\n\x07_schema"\xdb\x03\n\x08\x41sOfJoin\x12+\n\x04left\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04left\x12-\n\x05right\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\x05right\x12\x37\n\nleft_as_of\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x08leftAsOf\x12\x39\n\x0bright_as_of\x18\x04 \x01(\x0b\x32\x19.spark.connect.ExpressionR\trightAsOf\x12\x36\n\tjoin_expr\x18\x05 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x08joinExpr\x12#\n\rusing_columns\x18\x06 \x03(\tR\x0cusingColumns\x12\x1b\n\tjoin_type\x18\x07 \x01(\tR\x08joinType\x12\x37\n\ttolerance\x18\x08 \x01(\x0b\x32\x19.spark.connect.ExpressionR\ttolerance\x12.\n\x13\x61llow_exact_matches\x18\t 
\x01(\x08R\x11\x61llowExactMatches\x12\x1c\n\tdirection\x18\n \x01(\tR\tdirection"\xe6\x01\n\x0bLateralJoin\x12+\n\x04left\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04left\x12-\n\x05right\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\x05right\x12@\n\x0ejoin_condition\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\rjoinCondition\x12\x39\n\tjoin_type\x18\x04 \x01(\x0e\x32\x1c.spark.connect.Join.JoinTypeR\x08joinTypeB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
+ b'\n\x1dspark/connect/relations.proto\x12\rspark.connect\x1a\x19google/protobuf/any.proto\x1a\x1fspark/connect/expressions.proto\x1a\x19spark/connect/types.proto\x1a\x1bspark/connect/catalog.proto\x1a\x1aspark/connect/common.proto\x1a\x1dspark/connect/ml_common.proto"\x9c\x1d\n\x08Relation\x12\x35\n\x06\x63ommon\x18\x01 \x01(\x0b\x32\x1d.spark.connect.RelationCommonR\x06\x63ommon\x12)\n\x04read\x18\x02 \x01(\x0b\x32\x13.spark.connect.ReadH\x00R\x04read\x12\x32\n\x07project\x18\x03 \x01(\x0b\x32\x16.spark.connect.ProjectH\x00R\x07project\x12/\n\x06\x66ilter\x18\x04 \x01(\x0b\x32\x15.spark.connect.FilterH\x00R\x06\x66ilter\x12)\n\x04join\x18\x05 \x01(\x0b\x32\x13.spark.connect.JoinH\x00R\x04join\x12\x34\n\x06set_op\x18\x06 \x01(\x0b\x32\x1b.spark.connect.SetOperationH\x00R\x05setOp\x12)\n\x04sort\x18\x07 \x01(\x0b\x32\x13.spark.connect.SortH\x00R\x04sort\x12,\n\x05limit\x18\x08 \x01(\x0b\x32\x14.spark.connect.LimitH\x00R\x05limit\x12\x38\n\taggregate\x18\t \x01(\x0b\x32\x18.spark.connect.AggregateH\x00R\taggregate\x12&\n\x03sql\x18\n \x01(\x0b\x32\x12.spark.connect.SQLH\x00R\x03sql\x12\x45\n\x0elocal_relation\x18\x0b \x01(\x0b\x32\x1c.spark.connect.LocalRelationH\x00R\rlocalRelation\x12/\n\x06sample\x18\x0c \x01(\x0b\x32\x15.spark.connect.SampleH\x00R\x06sample\x12/\n\x06offset\x18\r \x01(\x0b\x32\x15.spark.connect.OffsetH\x00R\x06offset\x12>\n\x0b\x64\x65\x64uplicate\x18\x0e \x01(\x0b\x32\x1a.spark.connect.DeduplicateH\x00R\x0b\x64\x65\x64uplicate\x12,\n\x05range\x18\x0f \x01(\x0b\x32\x14.spark.connect.RangeH\x00R\x05range\x12\x45\n\x0esubquery_alias\x18\x10 \x01(\x0b\x32\x1c.spark.connect.SubqueryAliasH\x00R\rsubqueryAlias\x12>\n\x0brepartition\x18\x11 \x01(\x0b\x32\x1a.spark.connect.RepartitionH\x00R\x0brepartition\x12*\n\x05to_df\x18\x12 \x01(\x0b\x32\x13.spark.connect.ToDFH\x00R\x04toDf\x12U\n\x14with_columns_renamed\x18\x13 \x01(\x0b\x32!.spark.connect.WithColumnsRenamedH\x00R\x12withColumnsRenamed\x12<\n\x0bshow_string\x18\x14 \x01(\x0b\x32\x19.spark.connect.ShowStringH\x00R\nshowString\x12)\n\x04\x64rop\x18\x15 \x01(\x0b\x32\x13.spark.connect.DropH\x00R\x04\x64rop\x12)\n\x04tail\x18\x16 \x01(\x0b\x32\x13.spark.connect.TailH\x00R\x04tail\x12?\n\x0cwith_columns\x18\x17 \x01(\x0b\x32\x1a.spark.connect.WithColumnsH\x00R\x0bwithColumns\x12)\n\x04hint\x18\x18 \x01(\x0b\x32\x13.spark.connect.HintH\x00R\x04hint\x12\x32\n\x07unpivot\x18\x19 \x01(\x0b\x32\x16.spark.connect.UnpivotH\x00R\x07unpivot\x12\x36\n\tto_schema\x18\x1a \x01(\x0b\x32\x17.spark.connect.ToSchemaH\x00R\x08toSchema\x12\x64\n\x19repartition_by_expression\x18\x1b \x01(\x0b\x32&.spark.connect.RepartitionByExpressionH\x00R\x17repartitionByExpression\x12\x45\n\x0emap_partitions\x18\x1c \x01(\x0b\x32\x1c.spark.connect.MapPartitionsH\x00R\rmapPartitions\x12H\n\x0f\x63ollect_metrics\x18\x1d \x01(\x0b\x32\x1d.spark.connect.CollectMetricsH\x00R\x0e\x63ollectMetrics\x12,\n\x05parse\x18\x1e \x01(\x0b\x32\x14.spark.connect.ParseH\x00R\x05parse\x12\x36\n\tgroup_map\x18\x1f \x01(\x0b\x32\x17.spark.connect.GroupMapH\x00R\x08groupMap\x12=\n\x0c\x63o_group_map\x18 \x01(\x0b\x32\x19.spark.connect.CoGroupMapH\x00R\ncoGroupMap\x12\x45\n\x0ewith_watermark\x18! 
\x01(\x0b\x32\x1c.spark.connect.WithWatermarkH\x00R\rwithWatermark\x12\x63\n\x1a\x61pply_in_pandas_with_state\x18" \x01(\x0b\x32%.spark.connect.ApplyInPandasWithStateH\x00R\x16\x61pplyInPandasWithState\x12<\n\x0bhtml_string\x18# \x01(\x0b\x32\x19.spark.connect.HtmlStringH\x00R\nhtmlString\x12X\n\x15\x63\x61\x63hed_local_relation\x18$ \x01(\x0b\x32".spark.connect.CachedLocalRelationH\x00R\x13\x63\x61\x63hedLocalRelation\x12[\n\x16\x63\x61\x63hed_remote_relation\x18% \x01(\x0b\x32#.spark.connect.CachedRemoteRelationH\x00R\x14\x63\x61\x63hedRemoteRelation\x12\x8e\x01\n)common_inline_user_defined_table_function\x18& \x01(\x0b\x32\x33.spark.connect.CommonInlineUserDefinedTableFunctionH\x00R$commonInlineUserDefinedTableFunction\x12\x37\n\nas_of_join\x18\' \x01(\x0b\x32\x17.spark.connect.AsOfJoinH\x00R\x08\x61sOfJoin\x12\x85\x01\n&common_inline_user_defined_data_source\x18( \x01(\x0b\x32\x30.spark.connect.CommonInlineUserDefinedDataSourceH\x00R!commonInlineUserDefinedDataSource\x12\x45\n\x0ewith_relations\x18) \x01(\x0b\x32\x1c.spark.connect.WithRelationsH\x00R\rwithRelations\x12\x38\n\ttranspose\x18* \x01(\x0b\x32\x18.spark.connect.TransposeH\x00R\ttranspose\x12w\n unresolved_table_valued_function\x18+ \x01(\x0b\x32,.spark.connect.UnresolvedTableValuedFunctionH\x00R\x1dunresolvedTableValuedFunction\x12?\n\x0clateral_join\x18, \x01(\x0b\x32\x1a.spark.connect.LateralJoinH\x00R\x0blateralJoin\x12\x30\n\x07\x66ill_na\x18Z \x01(\x0b\x32\x15.spark.connect.NAFillH\x00R\x06\x66illNa\x12\x30\n\x07\x64rop_na\x18[ \x01(\x0b\x32\x15.spark.connect.NADropH\x00R\x06\x64ropNa\x12\x34\n\x07replace\x18\\ \x01(\x0b\x32\x18.spark.connect.NAReplaceH\x00R\x07replace\x12\x36\n\x07summary\x18\x64 \x01(\x0b\x32\x1a.spark.connect.StatSummaryH\x00R\x07summary\x12\x39\n\x08\x63rosstab\x18\x65 \x01(\x0b\x32\x1b.spark.connect.StatCrosstabH\x00R\x08\x63rosstab\x12\x39\n\x08\x64\x65scribe\x18\x66 \x01(\x0b\x32\x1b.spark.connect.StatDescribeH\x00R\x08\x64\x65scribe\x12*\n\x03\x63ov\x18g \x01(\x0b\x32\x16.spark.connect.StatCovH\x00R\x03\x63ov\x12-\n\x04\x63orr\x18h \x01(\x0b\x32\x17.spark.connect.StatCorrH\x00R\x04\x63orr\x12L\n\x0f\x61pprox_quantile\x18i \x01(\x0b\x32!.spark.connect.StatApproxQuantileH\x00R\x0e\x61pproxQuantile\x12=\n\nfreq_items\x18j \x01(\x0b\x32\x1c.spark.connect.StatFreqItemsH\x00R\tfreqItems\x12:\n\tsample_by\x18k \x01(\x0b\x32\x1b.spark.connect.StatSampleByH\x00R\x08sampleBy\x12\x33\n\x07\x63\x61talog\x18\xc8\x01 \x01(\x0b\x32\x16.spark.connect.CatalogH\x00R\x07\x63\x61talog\x12=\n\x0bml_relation\x18\xac\x02 \x01(\x0b\x32\x19.spark.connect.MlRelationH\x00R\nmlRelation\x12\x35\n\textension\x18\xe6\x07 \x01(\x0b\x32\x14.google.protobuf.AnyH\x00R\textension\x12\x33\n\x07unknown\x18\xe7\x07 \x01(\x0b\x32\x16.spark.connect.UnknownH\x00R\x07unknownB\n\n\x08rel_type"\xe4\x03\n\nMlRelation\x12\x43\n\ttransform\x18\x01 \x01(\x0b\x32#.spark.connect.MlRelation.TransformH\x00R\ttransform\x12,\n\x05\x66\x65tch\x18\x02 \x01(\x0b\x32\x14.spark.connect.FetchH\x00R\x05\x66\x65tch\x12P\n\x15model_summary_dataset\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationH\x01R\x13modelSummaryDataset\x88\x01\x01\x1a\xeb\x01\n\tTransform\x12\x33\n\x07obj_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefH\x00R\x06objRef\x12=\n\x0btransformer\x18\x02 \x01(\x0b\x32\x19.spark.connect.MlOperatorH\x00R\x0btransformer\x12-\n\x05input\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12/\n\x06params\x18\x04 
\x01(\x0b\x32\x17.spark.connect.MlParamsR\x06paramsB\n\n\x08operatorB\t\n\x07ml_typeB\x18\n\x16_model_summary_dataset"\xcb\x02\n\x05\x46\x65tch\x12\x31\n\x07obj_ref\x18\x01 \x01(\x0b\x32\x18.spark.connect.ObjectRefR\x06objRef\x12\x35\n\x07methods\x18\x02 \x03(\x0b\x32\x1b.spark.connect.Fetch.MethodR\x07methods\x1a\xd7\x01\n\x06Method\x12\x16\n\x06method\x18\x01 \x01(\tR\x06method\x12\x34\n\x04\x61rgs\x18\x02 \x03(\x0b\x32 .spark.connect.Fetch.Method.ArgsR\x04\x61rgs\x1a\x7f\n\x04\x41rgs\x12\x39\n\x05param\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralH\x00R\x05param\x12/\n\x05input\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationH\x00R\x05inputB\x0b\n\targs_type"\t\n\x07Unknown"\x8e\x01\n\x0eRelationCommon\x12#\n\x0bsource_info\x18\x01 \x01(\tB\x02\x18\x01R\nsourceInfo\x12\x1c\n\x07plan_id\x18\x02 \x01(\x03H\x00R\x06planId\x88\x01\x01\x12-\n\x06origin\x18\x03 \x01(\x0b\x32\x15.spark.connect.OriginR\x06originB\n\n\x08_plan_id"\xde\x03\n\x03SQL\x12\x14\n\x05query\x18\x01 \x01(\tR\x05query\x12\x34\n\x04\x61rgs\x18\x02 \x03(\x0b\x32\x1c.spark.connect.SQL.ArgsEntryB\x02\x18\x01R\x04\x61rgs\x12@\n\x08pos_args\x18\x03 \x03(\x0b\x32!.spark.connect.Expression.LiteralB\x02\x18\x01R\x07posArgs\x12O\n\x0fnamed_arguments\x18\x04 \x03(\x0b\x32&.spark.connect.SQL.NamedArgumentsEntryR\x0enamedArguments\x12>\n\rpos_arguments\x18\x05 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0cposArguments\x1aZ\n\tArgsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x37\n\x05value\x18\x02 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x05value:\x02\x38\x01\x1a\\\n\x13NamedArgumentsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12/\n\x05value\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x05value:\x02\x38\x01"u\n\rWithRelations\x12+\n\x04root\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04root\x12\x37\n\nreferences\x18\x02 \x03(\x0b\x32\x17.spark.connect.RelationR\nreferences"\x97\x05\n\x04Read\x12\x41\n\x0bnamed_table\x18\x01 \x01(\x0b\x32\x1e.spark.connect.Read.NamedTableH\x00R\nnamedTable\x12\x41\n\x0b\x64\x61ta_source\x18\x02 \x01(\x0b\x32\x1e.spark.connect.Read.DataSourceH\x00R\ndataSource\x12!\n\x0cis_streaming\x18\x03 \x01(\x08R\x0bisStreaming\x1a\xc0\x01\n\nNamedTable\x12/\n\x13unparsed_identifier\x18\x01 \x01(\tR\x12unparsedIdentifier\x12\x45\n\x07options\x18\x02 \x03(\x0b\x32+.spark.connect.Read.NamedTable.OptionsEntryR\x07options\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x1a\x95\x02\n\nDataSource\x12\x1b\n\x06\x66ormat\x18\x01 \x01(\tH\x00R\x06\x66ormat\x88\x01\x01\x12\x1b\n\x06schema\x18\x02 \x01(\tH\x01R\x06schema\x88\x01\x01\x12\x45\n\x07options\x18\x03 \x03(\x0b\x32+.spark.connect.Read.DataSource.OptionsEntryR\x07options\x12\x14\n\x05paths\x18\x04 \x03(\tR\x05paths\x12\x1e\n\npredicates\x18\x05 \x03(\tR\npredicates\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x42\t\n\x07_formatB\t\n\x07_schemaB\x0b\n\tread_type"u\n\x07Project\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12;\n\x0b\x65xpressions\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0b\x65xpressions"p\n\x06\x46ilter\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x37\n\tcondition\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\tcondition"\x95\x05\n\x04Join\x12+\n\x04left\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04left\x12-\n\x05right\x18\x02 
\x01(\x0b\x32\x17.spark.connect.RelationR\x05right\x12@\n\x0ejoin_condition\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\rjoinCondition\x12\x39\n\tjoin_type\x18\x04 \x01(\x0e\x32\x1c.spark.connect.Join.JoinTypeR\x08joinType\x12#\n\rusing_columns\x18\x05 \x03(\tR\x0cusingColumns\x12K\n\x0ejoin_data_type\x18\x06 \x01(\x0b\x32 .spark.connect.Join.JoinDataTypeH\x00R\x0cjoinDataType\x88\x01\x01\x1a\\\n\x0cJoinDataType\x12$\n\x0eis_left_struct\x18\x01 \x01(\x08R\x0cisLeftStruct\x12&\n\x0fis_right_struct\x18\x02 \x01(\x08R\risRightStruct"\xd0\x01\n\x08JoinType\x12\x19\n\x15JOIN_TYPE_UNSPECIFIED\x10\x00\x12\x13\n\x0fJOIN_TYPE_INNER\x10\x01\x12\x18\n\x14JOIN_TYPE_FULL_OUTER\x10\x02\x12\x18\n\x14JOIN_TYPE_LEFT_OUTER\x10\x03\x12\x19\n\x15JOIN_TYPE_RIGHT_OUTER\x10\x04\x12\x17\n\x13JOIN_TYPE_LEFT_ANTI\x10\x05\x12\x17\n\x13JOIN_TYPE_LEFT_SEMI\x10\x06\x12\x13\n\x0fJOIN_TYPE_CROSS\x10\x07\x42\x11\n\x0f_join_data_type"\xdf\x03\n\x0cSetOperation\x12\x36\n\nleft_input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\tleftInput\x12\x38\n\x0bright_input\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\nrightInput\x12\x45\n\x0bset_op_type\x18\x03 \x01(\x0e\x32%.spark.connect.SetOperation.SetOpTypeR\tsetOpType\x12\x1a\n\x06is_all\x18\x04 \x01(\x08H\x00R\x05isAll\x88\x01\x01\x12\x1c\n\x07\x62y_name\x18\x05 \x01(\x08H\x01R\x06\x62yName\x88\x01\x01\x12\x37\n\x15\x61llow_missing_columns\x18\x06 \x01(\x08H\x02R\x13\x61llowMissingColumns\x88\x01\x01"r\n\tSetOpType\x12\x1b\n\x17SET_OP_TYPE_UNSPECIFIED\x10\x00\x12\x19\n\x15SET_OP_TYPE_INTERSECT\x10\x01\x12\x15\n\x11SET_OP_TYPE_UNION\x10\x02\x12\x16\n\x12SET_OP_TYPE_EXCEPT\x10\x03\x42\t\n\x07_is_allB\n\n\x08_by_nameB\x18\n\x16_allow_missing_columns"L\n\x05Limit\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x14\n\x05limit\x18\x02 \x01(\x05R\x05limit"O\n\x06Offset\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x16\n\x06offset\x18\x02 \x01(\x05R\x06offset"K\n\x04Tail\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x14\n\x05limit\x18\x02 \x01(\x05R\x05limit"\xfe\x05\n\tAggregate\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x41\n\ngroup_type\x18\x02 \x01(\x0e\x32".spark.connect.Aggregate.GroupTypeR\tgroupType\x12L\n\x14grouping_expressions\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x13groupingExpressions\x12N\n\x15\x61ggregate_expressions\x18\x04 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x14\x61ggregateExpressions\x12\x34\n\x05pivot\x18\x05 \x01(\x0b\x32\x1e.spark.connect.Aggregate.PivotR\x05pivot\x12J\n\rgrouping_sets\x18\x06 \x03(\x0b\x32%.spark.connect.Aggregate.GroupingSetsR\x0cgroupingSets\x1ao\n\x05Pivot\x12+\n\x03\x63ol\x18\x01 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x03\x63ol\x12\x39\n\x06values\x18\x02 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x06values\x1aL\n\x0cGroupingSets\x12<\n\x0cgrouping_set\x18\x01 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0bgroupingSet"\x9f\x01\n\tGroupType\x12\x1a\n\x16GROUP_TYPE_UNSPECIFIED\x10\x00\x12\x16\n\x12GROUP_TYPE_GROUPBY\x10\x01\x12\x15\n\x11GROUP_TYPE_ROLLUP\x10\x02\x12\x13\n\x0fGROUP_TYPE_CUBE\x10\x03\x12\x14\n\x10GROUP_TYPE_PIVOT\x10\x04\x12\x1c\n\x18GROUP_TYPE_GROUPING_SETS\x10\x05"\xa0\x01\n\x04Sort\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x39\n\x05order\x18\x02 \x03(\x0b\x32#.spark.connect.Expression.SortOrderR\x05order\x12 \n\tis_global\x18\x03 
\x01(\x08H\x00R\x08isGlobal\x88\x01\x01\x42\x0c\n\n_is_global"\x8d\x01\n\x04\x44rop\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x33\n\x07\x63olumns\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x07\x63olumns\x12!\n\x0c\x63olumn_names\x18\x03 \x03(\tR\x0b\x63olumnNames"\xf0\x01\n\x0b\x44\x65\x64uplicate\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12!\n\x0c\x63olumn_names\x18\x02 \x03(\tR\x0b\x63olumnNames\x12\x32\n\x13\x61ll_columns_as_keys\x18\x03 \x01(\x08H\x00R\x10\x61llColumnsAsKeys\x88\x01\x01\x12.\n\x10within_watermark\x18\x04 \x01(\x08H\x01R\x0fwithinWatermark\x88\x01\x01\x42\x16\n\x14_all_columns_as_keysB\x13\n\x11_within_watermark"Y\n\rLocalRelation\x12\x17\n\x04\x64\x61ta\x18\x01 \x01(\x0cH\x00R\x04\x64\x61ta\x88\x01\x01\x12\x1b\n\x06schema\x18\x02 \x01(\tH\x01R\x06schema\x88\x01\x01\x42\x07\n\x05_dataB\t\n\x07_schema"H\n\x13\x43\x61\x63hedLocalRelation\x12\x12\n\x04hash\x18\x03 \x01(\tR\x04hashJ\x04\x08\x01\x10\x02J\x04\x08\x02\x10\x03R\x06userIdR\tsessionId"7\n\x14\x43\x61\x63hedRemoteRelation\x12\x1f\n\x0brelation_id\x18\x01 \x01(\tR\nrelationId"\x91\x02\n\x06Sample\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x1f\n\x0blower_bound\x18\x02 \x01(\x01R\nlowerBound\x12\x1f\n\x0bupper_bound\x18\x03 \x01(\x01R\nupperBound\x12.\n\x10with_replacement\x18\x04 \x01(\x08H\x00R\x0fwithReplacement\x88\x01\x01\x12\x17\n\x04seed\x18\x05 \x01(\x03H\x01R\x04seed\x88\x01\x01\x12/\n\x13\x64\x65terministic_order\x18\x06 \x01(\x08R\x12\x64\x65terministicOrderB\x13\n\x11_with_replacementB\x07\n\x05_seed"\x91\x01\n\x05Range\x12\x19\n\x05start\x18\x01 \x01(\x03H\x00R\x05start\x88\x01\x01\x12\x10\n\x03\x65nd\x18\x02 \x01(\x03R\x03\x65nd\x12\x12\n\x04step\x18\x03 \x01(\x03R\x04step\x12*\n\x0enum_partitions\x18\x04 \x01(\x05H\x01R\rnumPartitions\x88\x01\x01\x42\x08\n\x06_startB\x11\n\x0f_num_partitions"r\n\rSubqueryAlias\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x14\n\x05\x61lias\x18\x02 \x01(\tR\x05\x61lias\x12\x1c\n\tqualifier\x18\x03 \x03(\tR\tqualifier"\x8e\x01\n\x0bRepartition\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12%\n\x0enum_partitions\x18\x02 \x01(\x05R\rnumPartitions\x12\x1d\n\x07shuffle\x18\x03 \x01(\x08H\x00R\x07shuffle\x88\x01\x01\x42\n\n\x08_shuffle"\x8e\x01\n\nShowString\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x19\n\x08num_rows\x18\x02 \x01(\x05R\x07numRows\x12\x1a\n\x08truncate\x18\x03 \x01(\x05R\x08truncate\x12\x1a\n\x08vertical\x18\x04 \x01(\x08R\x08vertical"r\n\nHtmlString\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x19\n\x08num_rows\x18\x02 \x01(\x05R\x07numRows\x12\x1a\n\x08truncate\x18\x03 \x01(\x05R\x08truncate"\\\n\x0bStatSummary\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x1e\n\nstatistics\x18\x02 \x03(\tR\nstatistics"Q\n\x0cStatDescribe\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols"e\n\x0cStatCrosstab\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ol1\x18\x02 \x01(\tR\x04\x63ol1\x12\x12\n\x04\x63ol2\x18\x03 \x01(\tR\x04\x63ol2"`\n\x07StatCov\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ol1\x18\x02 \x01(\tR\x04\x63ol1\x12\x12\n\x04\x63ol2\x18\x03 \x01(\tR\x04\x63ol2"\x89\x01\n\x08StatCorr\x12-\n\x05input\x18\x01 
\x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ol1\x18\x02 \x01(\tR\x04\x63ol1\x12\x12\n\x04\x63ol2\x18\x03 \x01(\tR\x04\x63ol2\x12\x1b\n\x06method\x18\x04 \x01(\tH\x00R\x06method\x88\x01\x01\x42\t\n\x07_method"\xa4\x01\n\x12StatApproxQuantile\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12$\n\rprobabilities\x18\x03 \x03(\x01R\rprobabilities\x12%\n\x0erelative_error\x18\x04 \x01(\x01R\rrelativeError"}\n\rStatFreqItems\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12\x1d\n\x07support\x18\x03 \x01(\x01H\x00R\x07support\x88\x01\x01\x42\n\n\x08_support"\xb5\x02\n\x0cStatSampleBy\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12+\n\x03\x63ol\x18\x02 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x03\x63ol\x12\x42\n\tfractions\x18\x03 \x03(\x0b\x32$.spark.connect.StatSampleBy.FractionR\tfractions\x12\x17\n\x04seed\x18\x05 \x01(\x03H\x00R\x04seed\x88\x01\x01\x1a\x63\n\x08\x46raction\x12;\n\x07stratum\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x07stratum\x12\x1a\n\x08\x66raction\x18\x02 \x01(\x01R\x08\x66ractionB\x07\n\x05_seed"\x86\x01\n\x06NAFill\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12\x39\n\x06values\x18\x03 \x03(\x0b\x32!.spark.connect.Expression.LiteralR\x06values"\x86\x01\n\x06NADrop\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12\'\n\rmin_non_nulls\x18\x03 \x01(\x05H\x00R\x0bminNonNulls\x88\x01\x01\x42\x10\n\x0e_min_non_nulls"\xa8\x02\n\tNAReplace\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04\x63ols\x18\x02 \x03(\tR\x04\x63ols\x12H\n\x0creplacements\x18\x03 \x03(\x0b\x32$.spark.connect.NAReplace.ReplacementR\x0creplacements\x1a\x8d\x01\n\x0bReplacement\x12>\n\told_value\x18\x01 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x08oldValue\x12>\n\tnew_value\x18\x02 \x01(\x0b\x32!.spark.connect.Expression.LiteralR\x08newValue"X\n\x04ToDF\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12!\n\x0c\x63olumn_names\x18\x02 \x03(\tR\x0b\x63olumnNames"\xfe\x02\n\x12WithColumnsRenamed\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12i\n\x12rename_columns_map\x18\x02 \x03(\x0b\x32\x37.spark.connect.WithColumnsRenamed.RenameColumnsMapEntryB\x02\x18\x01R\x10renameColumnsMap\x12\x42\n\x07renames\x18\x03 \x03(\x0b\x32(.spark.connect.WithColumnsRenamed.RenameR\x07renames\x1a\x43\n\x15RenameColumnsMapEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01\x1a\x45\n\x06Rename\x12\x19\n\x08\x63ol_name\x18\x01 \x01(\tR\x07\x63olName\x12 \n\x0cnew_col_name\x18\x02 \x01(\tR\nnewColName"w\n\x0bWithColumns\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x39\n\x07\x61liases\x18\x02 \x03(\x0b\x32\x1f.spark.connect.Expression.AliasR\x07\x61liases"\x86\x01\n\rWithWatermark\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x1d\n\nevent_time\x18\x02 \x01(\tR\teventTime\x12\'\n\x0f\x64\x65lay_threshold\x18\x03 \x01(\tR\x0e\x64\x65layThreshold"\x84\x01\n\x04Hint\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04name\x18\x02 \x01(\tR\x04name\x12\x39\n\nparameters\x18\x03 
\x03(\x0b\x32\x19.spark.connect.ExpressionR\nparameters"\xc7\x02\n\x07Unpivot\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12+\n\x03ids\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x03ids\x12:\n\x06values\x18\x03 \x01(\x0b\x32\x1d.spark.connect.Unpivot.ValuesH\x00R\x06values\x88\x01\x01\x12\x30\n\x14variable_column_name\x18\x04 \x01(\tR\x12variableColumnName\x12*\n\x11value_column_name\x18\x05 \x01(\tR\x0fvalueColumnName\x1a;\n\x06Values\x12\x31\n\x06values\x18\x01 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x06valuesB\t\n\x07_values"z\n\tTranspose\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12>\n\rindex_columns\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0cindexColumns"}\n\x1dUnresolvedTableValuedFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12\x37\n\targuments\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments"j\n\x08ToSchema\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12/\n\x06schema\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x06schema"\xcb\x01\n\x17RepartitionByExpression\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x42\n\x0fpartition_exprs\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x0epartitionExprs\x12*\n\x0enum_partitions\x18\x03 \x01(\x05H\x00R\rnumPartitions\x88\x01\x01\x42\x11\n\x0f_num_partitions"\xe8\x01\n\rMapPartitions\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x42\n\x04\x66unc\x18\x02 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12"\n\nis_barrier\x18\x03 \x01(\x08H\x00R\tisBarrier\x88\x01\x01\x12"\n\nprofile_id\x18\x04 \x01(\x05H\x01R\tprofileId\x88\x01\x01\x42\r\n\x0b_is_barrierB\r\n\x0b_profile_id"\xd2\x06\n\x08GroupMap\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12L\n\x14grouping_expressions\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x13groupingExpressions\x12\x42\n\x04\x66unc\x18\x03 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12J\n\x13sorting_expressions\x18\x04 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x12sortingExpressions\x12<\n\rinitial_input\x18\x05 \x01(\x0b\x32\x17.spark.connect.RelationR\x0cinitialInput\x12[\n\x1cinitial_grouping_expressions\x18\x06 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x1ainitialGroupingExpressions\x12;\n\x18is_map_groups_with_state\x18\x07 \x01(\x08H\x00R\x14isMapGroupsWithState\x88\x01\x01\x12$\n\x0boutput_mode\x18\x08 \x01(\tH\x01R\noutputMode\x88\x01\x01\x12&\n\x0ctimeout_conf\x18\t \x01(\tH\x02R\x0btimeoutConf\x88\x01\x01\x12?\n\x0cstate_schema\x18\n \x01(\x0b\x32\x17.spark.connect.DataTypeH\x03R\x0bstateSchema\x88\x01\x01\x12\x65\n\x19transform_with_state_info\x18\x0b \x01(\x0b\x32%.spark.connect.TransformWithStateInfoH\x04R\x16transformWithStateInfo\x88\x01\x01\x42\x1b\n\x19_is_map_groups_with_stateB\x0e\n\x0c_output_modeB\x0f\n\r_timeout_confB\x0f\n\r_state_schemaB\x1c\n\x1a_transform_with_state_info"\xdf\x01\n\x16TransformWithStateInfo\x12\x1b\n\ttime_mode\x18\x01 \x01(\tR\x08timeMode\x12\x38\n\x16\x65vent_time_column_name\x18\x02 \x01(\tH\x00R\x13\x65ventTimeColumnName\x88\x01\x01\x12\x41\n\routput_schema\x18\x03 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x01R\x0coutputSchema\x88\x01\x01\x42\x19\n\x17_event_time_column_nameB\x10\n\x0e_output_schema"\x8e\x04\n\nCoGroupMap\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12W\n\x1ainput_grouping_expressions\x18\x02 
\x03(\x0b\x32\x19.spark.connect.ExpressionR\x18inputGroupingExpressions\x12-\n\x05other\x18\x03 \x01(\x0b\x32\x17.spark.connect.RelationR\x05other\x12W\n\x1aother_grouping_expressions\x18\x04 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x18otherGroupingExpressions\x12\x42\n\x04\x66unc\x18\x05 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12U\n\x19input_sorting_expressions\x18\x06 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x17inputSortingExpressions\x12U\n\x19other_sorting_expressions\x18\x07 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x17otherSortingExpressions"\xe5\x02\n\x16\x41pplyInPandasWithState\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12L\n\x14grouping_expressions\x18\x02 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x13groupingExpressions\x12\x42\n\x04\x66unc\x18\x03 \x01(\x0b\x32..spark.connect.CommonInlineUserDefinedFunctionR\x04\x66unc\x12#\n\routput_schema\x18\x04 \x01(\tR\x0coutputSchema\x12!\n\x0cstate_schema\x18\x05 \x01(\tR\x0bstateSchema\x12\x1f\n\x0boutput_mode\x18\x06 \x01(\tR\noutputMode\x12!\n\x0ctimeout_conf\x18\x07 \x01(\tR\x0btimeoutConf"\xf4\x01\n$CommonInlineUserDefinedTableFunction\x12#\n\rfunction_name\x18\x01 \x01(\tR\x0c\x66unctionName\x12$\n\rdeterministic\x18\x02 \x01(\x08R\rdeterministic\x12\x37\n\targuments\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\targuments\x12<\n\x0bpython_udtf\x18\x04 \x01(\x0b\x32\x19.spark.connect.PythonUDTFH\x00R\npythonUdtfB\n\n\x08\x66unction"\xb1\x01\n\nPythonUDTF\x12=\n\x0breturn_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\nreturnType\x88\x01\x01\x12\x1b\n\teval_type\x18\x02 \x01(\x05R\x08\x65valType\x12\x18\n\x07\x63ommand\x18\x03 \x01(\x0cR\x07\x63ommand\x12\x1d\n\npython_ver\x18\x04 \x01(\tR\tpythonVerB\x0e\n\x0c_return_type"\x97\x01\n!CommonInlineUserDefinedDataSource\x12\x12\n\x04name\x18\x01 \x01(\tR\x04name\x12O\n\x12python_data_source\x18\x02 \x01(\x0b\x32\x1f.spark.connect.PythonDataSourceH\x00R\x10pythonDataSourceB\r\n\x0b\x64\x61ta_source"K\n\x10PythonDataSource\x12\x18\n\x07\x63ommand\x18\x01 \x01(\x0cR\x07\x63ommand\x12\x1d\n\npython_ver\x18\x02 \x01(\tR\tpythonVer"\x88\x01\n\x0e\x43ollectMetrics\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x12\n\x04name\x18\x02 \x01(\tR\x04name\x12\x33\n\x07metrics\x18\x03 \x03(\x0b\x32\x19.spark.connect.ExpressionR\x07metrics"\x84\x03\n\x05Parse\x12-\n\x05input\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x05input\x12\x38\n\x06\x66ormat\x18\x02 \x01(\x0e\x32 .spark.connect.Parse.ParseFormatR\x06\x66ormat\x12\x34\n\x06schema\x18\x03 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x00R\x06schema\x88\x01\x01\x12;\n\x07options\x18\x04 \x03(\x0b\x32!.spark.connect.Parse.OptionsEntryR\x07options\x1a:\n\x0cOptionsEntry\x12\x10\n\x03key\x18\x01 \x01(\tR\x03key\x12\x14\n\x05value\x18\x02 \x01(\tR\x05value:\x02\x38\x01"X\n\x0bParseFormat\x12\x1c\n\x18PARSE_FORMAT_UNSPECIFIED\x10\x00\x12\x14\n\x10PARSE_FORMAT_CSV\x10\x01\x12\x15\n\x11PARSE_FORMAT_JSON\x10\x02\x42\t\n\x07_schema"\xdb\x03\n\x08\x41sOfJoin\x12+\n\x04left\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04left\x12-\n\x05right\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\x05right\x12\x37\n\nleft_as_of\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x08leftAsOf\x12\x39\n\x0bright_as_of\x18\x04 \x01(\x0b\x32\x19.spark.connect.ExpressionR\trightAsOf\x12\x36\n\tjoin_expr\x18\x05 \x01(\x0b\x32\x19.spark.connect.ExpressionR\x08joinExpr\x12#\n\rusing_columns\x18\x06 
\x03(\tR\x0cusingColumns\x12\x1b\n\tjoin_type\x18\x07 \x01(\tR\x08joinType\x12\x37\n\ttolerance\x18\x08 \x01(\x0b\x32\x19.spark.connect.ExpressionR\ttolerance\x12.\n\x13\x61llow_exact_matches\x18\t \x01(\x08R\x11\x61llowExactMatches\x12\x1c\n\tdirection\x18\n \x01(\tR\tdirection"\xe6\x01\n\x0bLateralJoin\x12+\n\x04left\x18\x01 \x01(\x0b\x32\x17.spark.connect.RelationR\x04left\x12-\n\x05right\x18\x02 \x01(\x0b\x32\x17.spark.connect.RelationR\x05right\x12@\n\x0ejoin_condition\x18\x03 \x01(\x0b\x32\x19.spark.connect.ExpressionR\rjoinCondition\x12\x39\n\tjoin_type\x18\x04 \x01(\x0e\x32\x1c.spark.connect.Join.JoinTypeR\x08joinTypeB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3'
)
_globals = globals()
@@ -81,169 +81,169 @@
_globals["_RELATION"]._serialized_start = 224
_globals["_RELATION"]._serialized_end = 3964
_globals["_MLRELATION"]._serialized_start = 3967
- _globals["_MLRELATION"]._serialized_end = 4343
- _globals["_MLRELATION_TRANSFORM"]._serialized_start = 4097
- _globals["_MLRELATION_TRANSFORM"]._serialized_end = 4332
- _globals["_FETCH"]._serialized_start = 4346
- _globals["_FETCH"]._serialized_end = 4677
- _globals["_FETCH_METHOD"]._serialized_start = 4462
- _globals["_FETCH_METHOD"]._serialized_end = 4677
- _globals["_FETCH_METHOD_ARGS"]._serialized_start = 4550
- _globals["_FETCH_METHOD_ARGS"]._serialized_end = 4677
- _globals["_UNKNOWN"]._serialized_start = 4679
- _globals["_UNKNOWN"]._serialized_end = 4688
- _globals["_RELATIONCOMMON"]._serialized_start = 4691
- _globals["_RELATIONCOMMON"]._serialized_end = 4833
- _globals["_SQL"]._serialized_start = 4836
- _globals["_SQL"]._serialized_end = 5314
- _globals["_SQL_ARGSENTRY"]._serialized_start = 5130
- _globals["_SQL_ARGSENTRY"]._serialized_end = 5220
- _globals["_SQL_NAMEDARGUMENTSENTRY"]._serialized_start = 5222
- _globals["_SQL_NAMEDARGUMENTSENTRY"]._serialized_end = 5314
- _globals["_WITHRELATIONS"]._serialized_start = 5316
- _globals["_WITHRELATIONS"]._serialized_end = 5433
- _globals["_READ"]._serialized_start = 5436
- _globals["_READ"]._serialized_end = 6099
- _globals["_READ_NAMEDTABLE"]._serialized_start = 5614
- _globals["_READ_NAMEDTABLE"]._serialized_end = 5806
- _globals["_READ_NAMEDTABLE_OPTIONSENTRY"]._serialized_start = 5748
- _globals["_READ_NAMEDTABLE_OPTIONSENTRY"]._serialized_end = 5806
- _globals["_READ_DATASOURCE"]._serialized_start = 5809
- _globals["_READ_DATASOURCE"]._serialized_end = 6086
- _globals["_READ_DATASOURCE_OPTIONSENTRY"]._serialized_start = 5748
- _globals["_READ_DATASOURCE_OPTIONSENTRY"]._serialized_end = 5806
- _globals["_PROJECT"]._serialized_start = 6101
- _globals["_PROJECT"]._serialized_end = 6218
- _globals["_FILTER"]._serialized_start = 6220
- _globals["_FILTER"]._serialized_end = 6332
- _globals["_JOIN"]._serialized_start = 6335
- _globals["_JOIN"]._serialized_end = 6996
- _globals["_JOIN_JOINDATATYPE"]._serialized_start = 6674
- _globals["_JOIN_JOINDATATYPE"]._serialized_end = 6766
- _globals["_JOIN_JOINTYPE"]._serialized_start = 6769
- _globals["_JOIN_JOINTYPE"]._serialized_end = 6977
- _globals["_SETOPERATION"]._serialized_start = 6999
- _globals["_SETOPERATION"]._serialized_end = 7478
- _globals["_SETOPERATION_SETOPTYPE"]._serialized_start = 7315
- _globals["_SETOPERATION_SETOPTYPE"]._serialized_end = 7429
- _globals["_LIMIT"]._serialized_start = 7480
- _globals["_LIMIT"]._serialized_end = 7556
- _globals["_OFFSET"]._serialized_start = 7558
- _globals["_OFFSET"]._serialized_end = 7637
- _globals["_TAIL"]._serialized_start = 7639
- _globals["_TAIL"]._serialized_end = 7714
- _globals["_AGGREGATE"]._serialized_start = 7717
- _globals["_AGGREGATE"]._serialized_end = 8483
- _globals["_AGGREGATE_PIVOT"]._serialized_start = 8132
- _globals["_AGGREGATE_PIVOT"]._serialized_end = 8243
- _globals["_AGGREGATE_GROUPINGSETS"]._serialized_start = 8245
- _globals["_AGGREGATE_GROUPINGSETS"]._serialized_end = 8321
- _globals["_AGGREGATE_GROUPTYPE"]._serialized_start = 8324
- _globals["_AGGREGATE_GROUPTYPE"]._serialized_end = 8483
- _globals["_SORT"]._serialized_start = 8486
- _globals["_SORT"]._serialized_end = 8646
- _globals["_DROP"]._serialized_start = 8649
- _globals["_DROP"]._serialized_end = 8790
- _globals["_DEDUPLICATE"]._serialized_start = 8793
- _globals["_DEDUPLICATE"]._serialized_end = 9033
- _globals["_LOCALRELATION"]._serialized_start = 9035
- _globals["_LOCALRELATION"]._serialized_end = 9124
- _globals["_CACHEDLOCALRELATION"]._serialized_start = 9126
- _globals["_CACHEDLOCALRELATION"]._serialized_end = 9198
- _globals["_CACHEDREMOTERELATION"]._serialized_start = 9200
- _globals["_CACHEDREMOTERELATION"]._serialized_end = 9255
- _globals["_SAMPLE"]._serialized_start = 9258
- _globals["_SAMPLE"]._serialized_end = 9531
- _globals["_RANGE"]._serialized_start = 9534
- _globals["_RANGE"]._serialized_end = 9679
- _globals["_SUBQUERYALIAS"]._serialized_start = 9681
- _globals["_SUBQUERYALIAS"]._serialized_end = 9795
- _globals["_REPARTITION"]._serialized_start = 9798
- _globals["_REPARTITION"]._serialized_end = 9940
- _globals["_SHOWSTRING"]._serialized_start = 9943
- _globals["_SHOWSTRING"]._serialized_end = 10085
- _globals["_HTMLSTRING"]._serialized_start = 10087
- _globals["_HTMLSTRING"]._serialized_end = 10201
- _globals["_STATSUMMARY"]._serialized_start = 10203
- _globals["_STATSUMMARY"]._serialized_end = 10295
- _globals["_STATDESCRIBE"]._serialized_start = 10297
- _globals["_STATDESCRIBE"]._serialized_end = 10378
- _globals["_STATCROSSTAB"]._serialized_start = 10380
- _globals["_STATCROSSTAB"]._serialized_end = 10481
- _globals["_STATCOV"]._serialized_start = 10483
- _globals["_STATCOV"]._serialized_end = 10579
- _globals["_STATCORR"]._serialized_start = 10582
- _globals["_STATCORR"]._serialized_end = 10719
- _globals["_STATAPPROXQUANTILE"]._serialized_start = 10722
- _globals["_STATAPPROXQUANTILE"]._serialized_end = 10886
- _globals["_STATFREQITEMS"]._serialized_start = 10888
- _globals["_STATFREQITEMS"]._serialized_end = 11013
- _globals["_STATSAMPLEBY"]._serialized_start = 11016
- _globals["_STATSAMPLEBY"]._serialized_end = 11325
- _globals["_STATSAMPLEBY_FRACTION"]._serialized_start = 11217
- _globals["_STATSAMPLEBY_FRACTION"]._serialized_end = 11316
- _globals["_NAFILL"]._serialized_start = 11328
- _globals["_NAFILL"]._serialized_end = 11462
- _globals["_NADROP"]._serialized_start = 11465
- _globals["_NADROP"]._serialized_end = 11599
- _globals["_NAREPLACE"]._serialized_start = 11602
- _globals["_NAREPLACE"]._serialized_end = 11898
- _globals["_NAREPLACE_REPLACEMENT"]._serialized_start = 11757
- _globals["_NAREPLACE_REPLACEMENT"]._serialized_end = 11898
- _globals["_TODF"]._serialized_start = 11900
- _globals["_TODF"]._serialized_end = 11988
- _globals["_WITHCOLUMNSRENAMED"]._serialized_start = 11991
- _globals["_WITHCOLUMNSRENAMED"]._serialized_end = 12373
- _globals["_WITHCOLUMNSRENAMED_RENAMECOLUMNSMAPENTRY"]._serialized_start = 12235
- _globals["_WITHCOLUMNSRENAMED_RENAMECOLUMNSMAPENTRY"]._serialized_end = 12302
- _globals["_WITHCOLUMNSRENAMED_RENAME"]._serialized_start = 12304
- _globals["_WITHCOLUMNSRENAMED_RENAME"]._serialized_end = 12373
- _globals["_WITHCOLUMNS"]._serialized_start = 12375
- _globals["_WITHCOLUMNS"]._serialized_end = 12494
- _globals["_WITHWATERMARK"]._serialized_start = 12497
- _globals["_WITHWATERMARK"]._serialized_end = 12631
- _globals["_HINT"]._serialized_start = 12634
- _globals["_HINT"]._serialized_end = 12766
- _globals["_UNPIVOT"]._serialized_start = 12769
- _globals["_UNPIVOT"]._serialized_end = 13096
- _globals["_UNPIVOT_VALUES"]._serialized_start = 13026
- _globals["_UNPIVOT_VALUES"]._serialized_end = 13085
- _globals["_TRANSPOSE"]._serialized_start = 13098
- _globals["_TRANSPOSE"]._serialized_end = 13220
- _globals["_UNRESOLVEDTABLEVALUEDFUNCTION"]._serialized_start = 13222
- _globals["_UNRESOLVEDTABLEVALUEDFUNCTION"]._serialized_end = 13347
- _globals["_TOSCHEMA"]._serialized_start = 13349
- _globals["_TOSCHEMA"]._serialized_end = 13455
- _globals["_REPARTITIONBYEXPRESSION"]._serialized_start = 13458
- _globals["_REPARTITIONBYEXPRESSION"]._serialized_end = 13661
- _globals["_MAPPARTITIONS"]._serialized_start = 13664
- _globals["_MAPPARTITIONS"]._serialized_end = 13896
- _globals["_GROUPMAP"]._serialized_start = 13899
- _globals["_GROUPMAP"]._serialized_end = 14749
- _globals["_TRANSFORMWITHSTATEINFO"]._serialized_start = 14752
- _globals["_TRANSFORMWITHSTATEINFO"]._serialized_end = 14975
- _globals["_COGROUPMAP"]._serialized_start = 14978
- _globals["_COGROUPMAP"]._serialized_end = 15504
- _globals["_APPLYINPANDASWITHSTATE"]._serialized_start = 15507
- _globals["_APPLYINPANDASWITHSTATE"]._serialized_end = 15864
- _globals["_COMMONINLINEUSERDEFINEDTABLEFUNCTION"]._serialized_start = 15867
- _globals["_COMMONINLINEUSERDEFINEDTABLEFUNCTION"]._serialized_end = 16111
- _globals["_PYTHONUDTF"]._serialized_start = 16114
- _globals["_PYTHONUDTF"]._serialized_end = 16291
- _globals["_COMMONINLINEUSERDEFINEDDATASOURCE"]._serialized_start = 16294
- _globals["_COMMONINLINEUSERDEFINEDDATASOURCE"]._serialized_end = 16445
- _globals["_PYTHONDATASOURCE"]._serialized_start = 16447
- _globals["_PYTHONDATASOURCE"]._serialized_end = 16522
- _globals["_COLLECTMETRICS"]._serialized_start = 16525
- _globals["_COLLECTMETRICS"]._serialized_end = 16661
- _globals["_PARSE"]._serialized_start = 16664
- _globals["_PARSE"]._serialized_end = 17052
- _globals["_PARSE_OPTIONSENTRY"]._serialized_start = 5748
- _globals["_PARSE_OPTIONSENTRY"]._serialized_end = 5806
- _globals["_PARSE_PARSEFORMAT"]._serialized_start = 16953
- _globals["_PARSE_PARSEFORMAT"]._serialized_end = 17041
- _globals["_ASOFJOIN"]._serialized_start = 17055
- _globals["_ASOFJOIN"]._serialized_end = 17530
- _globals["_LATERALJOIN"]._serialized_start = 17533
- _globals["_LATERALJOIN"]._serialized_end = 17763
+ _globals["_MLRELATION"]._serialized_end = 4451
+ _globals["_MLRELATION_TRANSFORM"]._serialized_start = 4179
+ _globals["_MLRELATION_TRANSFORM"]._serialized_end = 4414
+ _globals["_FETCH"]._serialized_start = 4454
+ _globals["_FETCH"]._serialized_end = 4785
+ _globals["_FETCH_METHOD"]._serialized_start = 4570
+ _globals["_FETCH_METHOD"]._serialized_end = 4785
+ _globals["_FETCH_METHOD_ARGS"]._serialized_start = 4658
+ _globals["_FETCH_METHOD_ARGS"]._serialized_end = 4785
+ _globals["_UNKNOWN"]._serialized_start = 4787
+ _globals["_UNKNOWN"]._serialized_end = 4796
+ _globals["_RELATIONCOMMON"]._serialized_start = 4799
+ _globals["_RELATIONCOMMON"]._serialized_end = 4941
+ _globals["_SQL"]._serialized_start = 4944
+ _globals["_SQL"]._serialized_end = 5422
+ _globals["_SQL_ARGSENTRY"]._serialized_start = 5238
+ _globals["_SQL_ARGSENTRY"]._serialized_end = 5328
+ _globals["_SQL_NAMEDARGUMENTSENTRY"]._serialized_start = 5330
+ _globals["_SQL_NAMEDARGUMENTSENTRY"]._serialized_end = 5422
+ _globals["_WITHRELATIONS"]._serialized_start = 5424
+ _globals["_WITHRELATIONS"]._serialized_end = 5541
+ _globals["_READ"]._serialized_start = 5544
+ _globals["_READ"]._serialized_end = 6207
+ _globals["_READ_NAMEDTABLE"]._serialized_start = 5722
+ _globals["_READ_NAMEDTABLE"]._serialized_end = 5914
+ _globals["_READ_NAMEDTABLE_OPTIONSENTRY"]._serialized_start = 5856
+ _globals["_READ_NAMEDTABLE_OPTIONSENTRY"]._serialized_end = 5914
+ _globals["_READ_DATASOURCE"]._serialized_start = 5917
+ _globals["_READ_DATASOURCE"]._serialized_end = 6194
+ _globals["_READ_DATASOURCE_OPTIONSENTRY"]._serialized_start = 5856
+ _globals["_READ_DATASOURCE_OPTIONSENTRY"]._serialized_end = 5914
+ _globals["_PROJECT"]._serialized_start = 6209
+ _globals["_PROJECT"]._serialized_end = 6326
+ _globals["_FILTER"]._serialized_start = 6328
+ _globals["_FILTER"]._serialized_end = 6440
+ _globals["_JOIN"]._serialized_start = 6443
+ _globals["_JOIN"]._serialized_end = 7104
+ _globals["_JOIN_JOINDATATYPE"]._serialized_start = 6782
+ _globals["_JOIN_JOINDATATYPE"]._serialized_end = 6874
+ _globals["_JOIN_JOINTYPE"]._serialized_start = 6877
+ _globals["_JOIN_JOINTYPE"]._serialized_end = 7085
+ _globals["_SETOPERATION"]._serialized_start = 7107
+ _globals["_SETOPERATION"]._serialized_end = 7586
+ _globals["_SETOPERATION_SETOPTYPE"]._serialized_start = 7423
+ _globals["_SETOPERATION_SETOPTYPE"]._serialized_end = 7537
+ _globals["_LIMIT"]._serialized_start = 7588
+ _globals["_LIMIT"]._serialized_end = 7664
+ _globals["_OFFSET"]._serialized_start = 7666
+ _globals["_OFFSET"]._serialized_end = 7745
+ _globals["_TAIL"]._serialized_start = 7747
+ _globals["_TAIL"]._serialized_end = 7822
+ _globals["_AGGREGATE"]._serialized_start = 7825
+ _globals["_AGGREGATE"]._serialized_end = 8591
+ _globals["_AGGREGATE_PIVOT"]._serialized_start = 8240
+ _globals["_AGGREGATE_PIVOT"]._serialized_end = 8351
+ _globals["_AGGREGATE_GROUPINGSETS"]._serialized_start = 8353
+ _globals["_AGGREGATE_GROUPINGSETS"]._serialized_end = 8429
+ _globals["_AGGREGATE_GROUPTYPE"]._serialized_start = 8432
+ _globals["_AGGREGATE_GROUPTYPE"]._serialized_end = 8591
+ _globals["_SORT"]._serialized_start = 8594
+ _globals["_SORT"]._serialized_end = 8754
+ _globals["_DROP"]._serialized_start = 8757
+ _globals["_DROP"]._serialized_end = 8898
+ _globals["_DEDUPLICATE"]._serialized_start = 8901
+ _globals["_DEDUPLICATE"]._serialized_end = 9141
+ _globals["_LOCALRELATION"]._serialized_start = 9143
+ _globals["_LOCALRELATION"]._serialized_end = 9232
+ _globals["_CACHEDLOCALRELATION"]._serialized_start = 9234
+ _globals["_CACHEDLOCALRELATION"]._serialized_end = 9306
+ _globals["_CACHEDREMOTERELATION"]._serialized_start = 9308
+ _globals["_CACHEDREMOTERELATION"]._serialized_end = 9363
+ _globals["_SAMPLE"]._serialized_start = 9366
+ _globals["_SAMPLE"]._serialized_end = 9639
+ _globals["_RANGE"]._serialized_start = 9642
+ _globals["_RANGE"]._serialized_end = 9787
+ _globals["_SUBQUERYALIAS"]._serialized_start = 9789
+ _globals["_SUBQUERYALIAS"]._serialized_end = 9903
+ _globals["_REPARTITION"]._serialized_start = 9906
+ _globals["_REPARTITION"]._serialized_end = 10048
+ _globals["_SHOWSTRING"]._serialized_start = 10051
+ _globals["_SHOWSTRING"]._serialized_end = 10193
+ _globals["_HTMLSTRING"]._serialized_start = 10195
+ _globals["_HTMLSTRING"]._serialized_end = 10309
+ _globals["_STATSUMMARY"]._serialized_start = 10311
+ _globals["_STATSUMMARY"]._serialized_end = 10403
+ _globals["_STATDESCRIBE"]._serialized_start = 10405
+ _globals["_STATDESCRIBE"]._serialized_end = 10486
+ _globals["_STATCROSSTAB"]._serialized_start = 10488
+ _globals["_STATCROSSTAB"]._serialized_end = 10589
+ _globals["_STATCOV"]._serialized_start = 10591
+ _globals["_STATCOV"]._serialized_end = 10687
+ _globals["_STATCORR"]._serialized_start = 10690
+ _globals["_STATCORR"]._serialized_end = 10827
+ _globals["_STATAPPROXQUANTILE"]._serialized_start = 10830
+ _globals["_STATAPPROXQUANTILE"]._serialized_end = 10994
+ _globals["_STATFREQITEMS"]._serialized_start = 10996
+ _globals["_STATFREQITEMS"]._serialized_end = 11121
+ _globals["_STATSAMPLEBY"]._serialized_start = 11124
+ _globals["_STATSAMPLEBY"]._serialized_end = 11433
+ _globals["_STATSAMPLEBY_FRACTION"]._serialized_start = 11325
+ _globals["_STATSAMPLEBY_FRACTION"]._serialized_end = 11424
+ _globals["_NAFILL"]._serialized_start = 11436
+ _globals["_NAFILL"]._serialized_end = 11570
+ _globals["_NADROP"]._serialized_start = 11573
+ _globals["_NADROP"]._serialized_end = 11707
+ _globals["_NAREPLACE"]._serialized_start = 11710
+ _globals["_NAREPLACE"]._serialized_end = 12006
+ _globals["_NAREPLACE_REPLACEMENT"]._serialized_start = 11865
+ _globals["_NAREPLACE_REPLACEMENT"]._serialized_end = 12006
+ _globals["_TODF"]._serialized_start = 12008
+ _globals["_TODF"]._serialized_end = 12096
+ _globals["_WITHCOLUMNSRENAMED"]._serialized_start = 12099
+ _globals["_WITHCOLUMNSRENAMED"]._serialized_end = 12481
+ _globals["_WITHCOLUMNSRENAMED_RENAMECOLUMNSMAPENTRY"]._serialized_start = 12343
+ _globals["_WITHCOLUMNSRENAMED_RENAMECOLUMNSMAPENTRY"]._serialized_end = 12410
+ _globals["_WITHCOLUMNSRENAMED_RENAME"]._serialized_start = 12412
+ _globals["_WITHCOLUMNSRENAMED_RENAME"]._serialized_end = 12481
+ _globals["_WITHCOLUMNS"]._serialized_start = 12483
+ _globals["_WITHCOLUMNS"]._serialized_end = 12602
+ _globals["_WITHWATERMARK"]._serialized_start = 12605
+ _globals["_WITHWATERMARK"]._serialized_end = 12739
+ _globals["_HINT"]._serialized_start = 12742
+ _globals["_HINT"]._serialized_end = 12874
+ _globals["_UNPIVOT"]._serialized_start = 12877
+ _globals["_UNPIVOT"]._serialized_end = 13204
+ _globals["_UNPIVOT_VALUES"]._serialized_start = 13134
+ _globals["_UNPIVOT_VALUES"]._serialized_end = 13193
+ _globals["_TRANSPOSE"]._serialized_start = 13206
+ _globals["_TRANSPOSE"]._serialized_end = 13328
+ _globals["_UNRESOLVEDTABLEVALUEDFUNCTION"]._serialized_start = 13330
+ _globals["_UNRESOLVEDTABLEVALUEDFUNCTION"]._serialized_end = 13455
+ _globals["_TOSCHEMA"]._serialized_start = 13457
+ _globals["_TOSCHEMA"]._serialized_end = 13563
+ _globals["_REPARTITIONBYEXPRESSION"]._serialized_start = 13566
+ _globals["_REPARTITIONBYEXPRESSION"]._serialized_end = 13769
+ _globals["_MAPPARTITIONS"]._serialized_start = 13772
+ _globals["_MAPPARTITIONS"]._serialized_end = 14004
+ _globals["_GROUPMAP"]._serialized_start = 14007
+ _globals["_GROUPMAP"]._serialized_end = 14857
+ _globals["_TRANSFORMWITHSTATEINFO"]._serialized_start = 14860
+ _globals["_TRANSFORMWITHSTATEINFO"]._serialized_end = 15083
+ _globals["_COGROUPMAP"]._serialized_start = 15086
+ _globals["_COGROUPMAP"]._serialized_end = 15612
+ _globals["_APPLYINPANDASWITHSTATE"]._serialized_start = 15615
+ _globals["_APPLYINPANDASWITHSTATE"]._serialized_end = 15972
+ _globals["_COMMONINLINEUSERDEFINEDTABLEFUNCTION"]._serialized_start = 15975
+ _globals["_COMMONINLINEUSERDEFINEDTABLEFUNCTION"]._serialized_end = 16219
+ _globals["_PYTHONUDTF"]._serialized_start = 16222
+ _globals["_PYTHONUDTF"]._serialized_end = 16399
+ _globals["_COMMONINLINEUSERDEFINEDDATASOURCE"]._serialized_start = 16402
+ _globals["_COMMONINLINEUSERDEFINEDDATASOURCE"]._serialized_end = 16553
+ _globals["_PYTHONDATASOURCE"]._serialized_start = 16555
+ _globals["_PYTHONDATASOURCE"]._serialized_end = 16630
+ _globals["_COLLECTMETRICS"]._serialized_start = 16633
+ _globals["_COLLECTMETRICS"]._serialized_end = 16769
+ _globals["_PARSE"]._serialized_start = 16772
+ _globals["_PARSE"]._serialized_end = 17160
+ _globals["_PARSE_OPTIONSENTRY"]._serialized_start = 5856
+ _globals["_PARSE_OPTIONSENTRY"]._serialized_end = 5914
+ _globals["_PARSE_PARSEFORMAT"]._serialized_start = 17061
+ _globals["_PARSE_PARSEFORMAT"]._serialized_end = 17149
+ _globals["_ASOFJOIN"]._serialized_start = 17163
+ _globals["_ASOFJOIN"]._serialized_end = 17638
+ _globals["_LATERALJOIN"]._serialized_start = 17641
+ _globals["_LATERALJOIN"]._serialized_end = 17871
# @@protoc_insertion_point(module_scope)
diff --git a/python/pyspark/sql/connect/proto/relations_pb2.pyi b/python/pyspark/sql/connect/proto/relations_pb2.pyi
index beeeb712da762..e1eb7945c19f0 100644
--- a/python/pyspark/sql/connect/proto/relations_pb2.pyi
+++ b/python/pyspark/sql/connect/proto/relations_pb2.pyi
@@ -707,28 +707,57 @@ class MlRelation(google.protobuf.message.Message):
TRANSFORM_FIELD_NUMBER: builtins.int
FETCH_FIELD_NUMBER: builtins.int
+ MODEL_SUMMARY_DATASET_FIELD_NUMBER: builtins.int
@property
def transform(self) -> global___MlRelation.Transform: ...
@property
def fetch(self) -> global___Fetch: ...
+ @property
+ def model_summary_dataset(self) -> global___Relation:
+ """(Optional) the dataset for restoring the model summary"""
def __init__(
self,
*,
transform: global___MlRelation.Transform | None = ...,
fetch: global___Fetch | None = ...,
+ model_summary_dataset: global___Relation | None = ...,
) -> None: ...
def HasField(
self,
field_name: typing_extensions.Literal[
- "fetch", b"fetch", "ml_type", b"ml_type", "transform", b"transform"
+ "_model_summary_dataset",
+ b"_model_summary_dataset",
+ "fetch",
+ b"fetch",
+ "ml_type",
+ b"ml_type",
+ "model_summary_dataset",
+ b"model_summary_dataset",
+ "transform",
+ b"transform",
],
) -> builtins.bool: ...
def ClearField(
self,
field_name: typing_extensions.Literal[
- "fetch", b"fetch", "ml_type", b"ml_type", "transform", b"transform"
+ "_model_summary_dataset",
+ b"_model_summary_dataset",
+ "fetch",
+ b"fetch",
+ "ml_type",
+ b"ml_type",
+ "model_summary_dataset",
+ b"model_summary_dataset",
+ "transform",
+ b"transform",
],
) -> None: ...
+ @typing.overload
+ def WhichOneof(
+ self,
+ oneof_group: typing_extensions.Literal["_model_summary_dataset", b"_model_summary_dataset"],
+ ) -> typing_extensions.Literal["model_summary_dataset"] | None: ...
+ @typing.overload
def WhichOneof(
self, oneof_group: typing_extensions.Literal["ml_type", b"ml_type"]
) -> typing_extensions.Literal["transform", "fetch"] | None: ...
diff --git a/python/pyspark/sql/connect/proto/types_pb2.py b/python/pyspark/sql/connect/proto/types_pb2.py
index 2e0ef70484666..3f43bf35af40f 100644
--- a/python/pyspark/sql/connect/proto/types_pb2.py
+++ b/python/pyspark/sql/connect/proto/types_pb2.py
@@ -35,7 +35,7 @@
DESCRIPTOR = _descriptor_pool.Default().AddSerializedFile(
- b"\n\x19spark/connect/types.proto\x12\rspark.connect\"\xf9!\n\x08\x44\x61taType\x12\x32\n\x04null\x18\x01 \x01(\x0b\x32\x1c.spark.connect.DataType.NULLH\x00R\x04null\x12\x38\n\x06\x62inary\x18\x02 \x01(\x0b\x32\x1e.spark.connect.DataType.BinaryH\x00R\x06\x62inary\x12;\n\x07\x62oolean\x18\x03 \x01(\x0b\x32\x1f.spark.connect.DataType.BooleanH\x00R\x07\x62oolean\x12\x32\n\x04\x62yte\x18\x04 \x01(\x0b\x32\x1c.spark.connect.DataType.ByteH\x00R\x04\x62yte\x12\x35\n\x05short\x18\x05 \x01(\x0b\x32\x1d.spark.connect.DataType.ShortH\x00R\x05short\x12;\n\x07integer\x18\x06 \x01(\x0b\x32\x1f.spark.connect.DataType.IntegerH\x00R\x07integer\x12\x32\n\x04long\x18\x07 \x01(\x0b\x32\x1c.spark.connect.DataType.LongH\x00R\x04long\x12\x35\n\x05\x66loat\x18\x08 \x01(\x0b\x32\x1d.spark.connect.DataType.FloatH\x00R\x05\x66loat\x12\x38\n\x06\x64ouble\x18\t \x01(\x0b\x32\x1e.spark.connect.DataType.DoubleH\x00R\x06\x64ouble\x12;\n\x07\x64\x65\x63imal\x18\n \x01(\x0b\x32\x1f.spark.connect.DataType.DecimalH\x00R\x07\x64\x65\x63imal\x12\x38\n\x06string\x18\x0b \x01(\x0b\x32\x1e.spark.connect.DataType.StringH\x00R\x06string\x12\x32\n\x04\x63har\x18\x0c \x01(\x0b\x32\x1c.spark.connect.DataType.CharH\x00R\x04\x63har\x12<\n\x08var_char\x18\r \x01(\x0b\x32\x1f.spark.connect.DataType.VarCharH\x00R\x07varChar\x12\x32\n\x04\x64\x61te\x18\x0e \x01(\x0b\x32\x1c.spark.connect.DataType.DateH\x00R\x04\x64\x61te\x12\x41\n\ttimestamp\x18\x0f \x01(\x0b\x32!.spark.connect.DataType.TimestampH\x00R\ttimestamp\x12K\n\rtimestamp_ntz\x18\x10 \x01(\x0b\x32$.spark.connect.DataType.TimestampNTZH\x00R\x0ctimestampNtz\x12W\n\x11\x63\x61lendar_interval\x18\x11 \x01(\x0b\x32(.spark.connect.DataType.CalendarIntervalH\x00R\x10\x63\x61lendarInterval\x12[\n\x13year_month_interval\x18\x12 \x01(\x0b\x32).spark.connect.DataType.YearMonthIntervalH\x00R\x11yearMonthInterval\x12U\n\x11\x64\x61y_time_interval\x18\x13 \x01(\x0b\x32'.spark.connect.DataType.DayTimeIntervalH\x00R\x0f\x64\x61yTimeInterval\x12\x35\n\x05\x61rray\x18\x14 \x01(\x0b\x32\x1d.spark.connect.DataType.ArrayH\x00R\x05\x61rray\x12\x38\n\x06struct\x18\x15 \x01(\x0b\x32\x1e.spark.connect.DataType.StructH\x00R\x06struct\x12/\n\x03map\x18\x16 \x01(\x0b\x32\x1b.spark.connect.DataType.MapH\x00R\x03map\x12;\n\x07variant\x18\x19 \x01(\x0b\x32\x1f.spark.connect.DataType.VariantH\x00R\x07variant\x12/\n\x03udt\x18\x17 \x01(\x0b\x32\x1b.spark.connect.DataType.UDTH\x00R\x03udt\x12>\n\x08unparsed\x18\x18 \x01(\x0b\x32 .spark.connect.DataType.UnparsedH\x00R\x08unparsed\x1a\x43\n\x07\x42oolean\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04\x42yte\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x41\n\x05Short\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x43\n\x07Integer\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04Long\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x41\n\x05\x46loat\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x42\n\x06\x44ouble\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a`\n\x06String\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x12\x1c\n\tcollation\x18\x02 \x01(\tR\tcollation\x1a\x42\n\x06\x42inary\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04NULL\x12\x38\n\x18type_variation_reference\x18\x01 
\x01(\rR\x16typeVariationReference\x1a\x45\n\tTimestamp\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04\x44\x61te\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1aH\n\x0cTimestampNTZ\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1aL\n\x10\x43\x61lendarInterval\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\xb3\x01\n\x11YearMonthInterval\x12$\n\x0bstart_field\x18\x01 \x01(\x05H\x00R\nstartField\x88\x01\x01\x12 \n\tend_field\x18\x02 \x01(\x05H\x01R\x08\x65ndField\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReferenceB\x0e\n\x0c_start_fieldB\x0c\n\n_end_field\x1a\xb1\x01\n\x0f\x44\x61yTimeInterval\x12$\n\x0bstart_field\x18\x01 \x01(\x05H\x00R\nstartField\x88\x01\x01\x12 \n\tend_field\x18\x02 \x01(\x05H\x01R\x08\x65ndField\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReferenceB\x0e\n\x0c_start_fieldB\x0c\n\n_end_field\x1aX\n\x04\x43har\x12\x16\n\x06length\x18\x01 \x01(\x05R\x06length\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReference\x1a[\n\x07VarChar\x12\x16\n\x06length\x18\x01 \x01(\x05R\x06length\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReference\x1a\x99\x01\n\x07\x44\x65\x63imal\x12\x19\n\x05scale\x18\x01 \x01(\x05H\x00R\x05scale\x88\x01\x01\x12!\n\tprecision\x18\x02 \x01(\x05H\x01R\tprecision\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReferenceB\x08\n\x06_scaleB\x0c\n\n_precision\x1a\xa1\x01\n\x0bStructField\x12\x12\n\x04name\x18\x01 \x01(\tR\x04name\x12\x34\n\tdata_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x08\x64\x61taType\x12\x1a\n\x08nullable\x18\x03 \x01(\x08R\x08nullable\x12\x1f\n\x08metadata\x18\x04 \x01(\tH\x00R\x08metadata\x88\x01\x01\x42\x0b\n\t_metadata\x1a\x7f\n\x06Struct\x12;\n\x06\x66ields\x18\x01 \x03(\x0b\x32#.spark.connect.DataType.StructFieldR\x06\x66ields\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReference\x1a\xa2\x01\n\x05\x41rray\x12:\n\x0c\x65lement_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x0b\x65lementType\x12#\n\rcontains_null\x18\x02 \x01(\x08R\x0c\x63ontainsNull\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReference\x1a\xdb\x01\n\x03Map\x12\x32\n\x08key_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x07keyType\x12\x36\n\nvalue_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\tvalueType\x12.\n\x13value_contains_null\x18\x03 \x01(\x08R\x11valueContainsNull\x12\x38\n\x18type_variation_reference\x18\x04 \x01(\rR\x16typeVariationReference\x1a\x43\n\x07Variant\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\xa1\x02\n\x03UDT\x12\x12\n\x04type\x18\x01 \x01(\tR\x04type\x12 \n\tjvm_class\x18\x02 \x01(\tH\x00R\x08jvmClass\x88\x01\x01\x12&\n\x0cpython_class\x18\x03 \x01(\tH\x01R\x0bpythonClass\x88\x01\x01\x12;\n\x17serialized_python_class\x18\x04 \x01(\tH\x02R\x15serializedPythonClass\x88\x01\x01\x12\x37\n\x08sql_type\x18\x05 \x01(\x0b\x32\x17.spark.connect.DataTypeH\x03R\x07sqlType\x88\x01\x01\x42\x0c\n\n_jvm_classB\x0f\n\r_python_classB\x1a\n\x18_serialized_python_classB\x0b\n\t_sql_type\x1a\x34\n\x08Unparsed\x12(\n\x10\x64\x61ta_type_string\x18\x01 \x01(\tR\x0e\x64\x61taTypeStringB\x06\n\x04kindB6\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3"
+ b"\n\x19spark/connect/types.proto\x12\rspark.connect\"\xac#\n\x08\x44\x61taType\x12\x32\n\x04null\x18\x01 \x01(\x0b\x32\x1c.spark.connect.DataType.NULLH\x00R\x04null\x12\x38\n\x06\x62inary\x18\x02 \x01(\x0b\x32\x1e.spark.connect.DataType.BinaryH\x00R\x06\x62inary\x12;\n\x07\x62oolean\x18\x03 \x01(\x0b\x32\x1f.spark.connect.DataType.BooleanH\x00R\x07\x62oolean\x12\x32\n\x04\x62yte\x18\x04 \x01(\x0b\x32\x1c.spark.connect.DataType.ByteH\x00R\x04\x62yte\x12\x35\n\x05short\x18\x05 \x01(\x0b\x32\x1d.spark.connect.DataType.ShortH\x00R\x05short\x12;\n\x07integer\x18\x06 \x01(\x0b\x32\x1f.spark.connect.DataType.IntegerH\x00R\x07integer\x12\x32\n\x04long\x18\x07 \x01(\x0b\x32\x1c.spark.connect.DataType.LongH\x00R\x04long\x12\x35\n\x05\x66loat\x18\x08 \x01(\x0b\x32\x1d.spark.connect.DataType.FloatH\x00R\x05\x66loat\x12\x38\n\x06\x64ouble\x18\t \x01(\x0b\x32\x1e.spark.connect.DataType.DoubleH\x00R\x06\x64ouble\x12;\n\x07\x64\x65\x63imal\x18\n \x01(\x0b\x32\x1f.spark.connect.DataType.DecimalH\x00R\x07\x64\x65\x63imal\x12\x38\n\x06string\x18\x0b \x01(\x0b\x32\x1e.spark.connect.DataType.StringH\x00R\x06string\x12\x32\n\x04\x63har\x18\x0c \x01(\x0b\x32\x1c.spark.connect.DataType.CharH\x00R\x04\x63har\x12<\n\x08var_char\x18\r \x01(\x0b\x32\x1f.spark.connect.DataType.VarCharH\x00R\x07varChar\x12\x32\n\x04\x64\x61te\x18\x0e \x01(\x0b\x32\x1c.spark.connect.DataType.DateH\x00R\x04\x64\x61te\x12\x41\n\ttimestamp\x18\x0f \x01(\x0b\x32!.spark.connect.DataType.TimestampH\x00R\ttimestamp\x12K\n\rtimestamp_ntz\x18\x10 \x01(\x0b\x32$.spark.connect.DataType.TimestampNTZH\x00R\x0ctimestampNtz\x12W\n\x11\x63\x61lendar_interval\x18\x11 \x01(\x0b\x32(.spark.connect.DataType.CalendarIntervalH\x00R\x10\x63\x61lendarInterval\x12[\n\x13year_month_interval\x18\x12 \x01(\x0b\x32).spark.connect.DataType.YearMonthIntervalH\x00R\x11yearMonthInterval\x12U\n\x11\x64\x61y_time_interval\x18\x13 \x01(\x0b\x32'.spark.connect.DataType.DayTimeIntervalH\x00R\x0f\x64\x61yTimeInterval\x12\x35\n\x05\x61rray\x18\x14 \x01(\x0b\x32\x1d.spark.connect.DataType.ArrayH\x00R\x05\x61rray\x12\x38\n\x06struct\x18\x15 \x01(\x0b\x32\x1e.spark.connect.DataType.StructH\x00R\x06struct\x12/\n\x03map\x18\x16 \x01(\x0b\x32\x1b.spark.connect.DataType.MapH\x00R\x03map\x12;\n\x07variant\x18\x19 \x01(\x0b\x32\x1f.spark.connect.DataType.VariantH\x00R\x07variant\x12/\n\x03udt\x18\x17 \x01(\x0b\x32\x1b.spark.connect.DataType.UDTH\x00R\x03udt\x12>\n\x08unparsed\x18\x18 \x01(\x0b\x32 .spark.connect.DataType.UnparsedH\x00R\x08unparsed\x12\x32\n\x04time\x18\x1c \x01(\x0b\x32\x1c.spark.connect.DataType.TimeH\x00R\x04time\x1a\x43\n\x07\x42oolean\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04\x42yte\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x41\n\x05Short\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x43\n\x07Integer\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04Long\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x41\n\x05\x46loat\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x42\n\x06\x44ouble\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a`\n\x06String\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x12\x1c\n\tcollation\x18\x02 \x01(\tR\tcollation\x1a\x42\n\x06\x42inary\x12\x38\n\x18type_variation_reference\x18\x01 
\x01(\rR\x16typeVariationReference\x1a@\n\x04NULL\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\x45\n\tTimestamp\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a@\n\x04\x44\x61te\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1aH\n\x0cTimestampNTZ\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1aq\n\x04Time\x12!\n\tprecision\x18\x01 \x01(\x05H\x00R\tprecision\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReferenceB\x0c\n\n_precision\x1aL\n\x10\x43\x61lendarInterval\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\xb3\x01\n\x11YearMonthInterval\x12$\n\x0bstart_field\x18\x01 \x01(\x05H\x00R\nstartField\x88\x01\x01\x12 \n\tend_field\x18\x02 \x01(\x05H\x01R\x08\x65ndField\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReferenceB\x0e\n\x0c_start_fieldB\x0c\n\n_end_field\x1a\xb1\x01\n\x0f\x44\x61yTimeInterval\x12$\n\x0bstart_field\x18\x01 \x01(\x05H\x00R\nstartField\x88\x01\x01\x12 \n\tend_field\x18\x02 \x01(\x05H\x01R\x08\x65ndField\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReferenceB\x0e\n\x0c_start_fieldB\x0c\n\n_end_field\x1aX\n\x04\x43har\x12\x16\n\x06length\x18\x01 \x01(\x05R\x06length\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReference\x1a[\n\x07VarChar\x12\x16\n\x06length\x18\x01 \x01(\x05R\x06length\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReference\x1a\x99\x01\n\x07\x44\x65\x63imal\x12\x19\n\x05scale\x18\x01 \x01(\x05H\x00R\x05scale\x88\x01\x01\x12!\n\tprecision\x18\x02 \x01(\x05H\x01R\tprecision\x88\x01\x01\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReferenceB\x08\n\x06_scaleB\x0c\n\n_precision\x1a\xa1\x01\n\x0bStructField\x12\x12\n\x04name\x18\x01 \x01(\tR\x04name\x12\x34\n\tdata_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x08\x64\x61taType\x12\x1a\n\x08nullable\x18\x03 \x01(\x08R\x08nullable\x12\x1f\n\x08metadata\x18\x04 \x01(\tH\x00R\x08metadata\x88\x01\x01\x42\x0b\n\t_metadata\x1a\x7f\n\x06Struct\x12;\n\x06\x66ields\x18\x01 \x03(\x0b\x32#.spark.connect.DataType.StructFieldR\x06\x66ields\x12\x38\n\x18type_variation_reference\x18\x02 \x01(\rR\x16typeVariationReference\x1a\xa2\x01\n\x05\x41rray\x12:\n\x0c\x65lement_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x0b\x65lementType\x12#\n\rcontains_null\x18\x02 \x01(\x08R\x0c\x63ontainsNull\x12\x38\n\x18type_variation_reference\x18\x03 \x01(\rR\x16typeVariationReference\x1a\xdb\x01\n\x03Map\x12\x32\n\x08key_type\x18\x01 \x01(\x0b\x32\x17.spark.connect.DataTypeR\x07keyType\x12\x36\n\nvalue_type\x18\x02 \x01(\x0b\x32\x17.spark.connect.DataTypeR\tvalueType\x12.\n\x13value_contains_null\x18\x03 \x01(\x08R\x11valueContainsNull\x12\x38\n\x18type_variation_reference\x18\x04 \x01(\rR\x16typeVariationReference\x1a\x43\n\x07Variant\x12\x38\n\x18type_variation_reference\x18\x01 \x01(\rR\x16typeVariationReference\x1a\xa1\x02\n\x03UDT\x12\x12\n\x04type\x18\x01 \x01(\tR\x04type\x12 \n\tjvm_class\x18\x02 \x01(\tH\x00R\x08jvmClass\x88\x01\x01\x12&\n\x0cpython_class\x18\x03 \x01(\tH\x01R\x0bpythonClass\x88\x01\x01\x12;\n\x17serialized_python_class\x18\x04 \x01(\tH\x02R\x15serializedPythonClass\x88\x01\x01\x12\x37\n\x08sql_type\x18\x05 
\x01(\x0b\x32\x17.spark.connect.DataTypeH\x03R\x07sqlType\x88\x01\x01\x42\x0c\n\n_jvm_classB\x0f\n\r_python_classB\x1a\n\x18_serialized_python_classB\x0b\n\t_sql_type\x1a\x34\n\x08Unparsed\x12(\n\x10\x64\x61ta_type_string\x18\x01 \x01(\tR\x0e\x64\x61taTypeStringB\x06\n\x04kindJ\x04\x08\x1a\x10\x1bJ\x04\x08\x1b\x10\x1c\x42\x36\n\x1eorg.apache.spark.connect.protoP\x01Z\x12internal/generatedb\x06proto3"
)
_globals = globals()
@@ -47,57 +47,59 @@
"DESCRIPTOR"
]._serialized_options = b"\n\036org.apache.spark.connect.protoP\001Z\022internal/generated"
_globals["_DATATYPE"]._serialized_start = 45
- _globals["_DATATYPE"]._serialized_end = 4390
- _globals["_DATATYPE_BOOLEAN"]._serialized_start = 1595
- _globals["_DATATYPE_BOOLEAN"]._serialized_end = 1662
- _globals["_DATATYPE_BYTE"]._serialized_start = 1664
- _globals["_DATATYPE_BYTE"]._serialized_end = 1728
- _globals["_DATATYPE_SHORT"]._serialized_start = 1730
- _globals["_DATATYPE_SHORT"]._serialized_end = 1795
- _globals["_DATATYPE_INTEGER"]._serialized_start = 1797
- _globals["_DATATYPE_INTEGER"]._serialized_end = 1864
- _globals["_DATATYPE_LONG"]._serialized_start = 1866
- _globals["_DATATYPE_LONG"]._serialized_end = 1930
- _globals["_DATATYPE_FLOAT"]._serialized_start = 1932
- _globals["_DATATYPE_FLOAT"]._serialized_end = 1997
- _globals["_DATATYPE_DOUBLE"]._serialized_start = 1999
- _globals["_DATATYPE_DOUBLE"]._serialized_end = 2065
- _globals["_DATATYPE_STRING"]._serialized_start = 2067
- _globals["_DATATYPE_STRING"]._serialized_end = 2163
- _globals["_DATATYPE_BINARY"]._serialized_start = 2165
- _globals["_DATATYPE_BINARY"]._serialized_end = 2231
- _globals["_DATATYPE_NULL"]._serialized_start = 2233
- _globals["_DATATYPE_NULL"]._serialized_end = 2297
- _globals["_DATATYPE_TIMESTAMP"]._serialized_start = 2299
- _globals["_DATATYPE_TIMESTAMP"]._serialized_end = 2368
- _globals["_DATATYPE_DATE"]._serialized_start = 2370
- _globals["_DATATYPE_DATE"]._serialized_end = 2434
- _globals["_DATATYPE_TIMESTAMPNTZ"]._serialized_start = 2436
- _globals["_DATATYPE_TIMESTAMPNTZ"]._serialized_end = 2508
- _globals["_DATATYPE_CALENDARINTERVAL"]._serialized_start = 2510
- _globals["_DATATYPE_CALENDARINTERVAL"]._serialized_end = 2586
- _globals["_DATATYPE_YEARMONTHINTERVAL"]._serialized_start = 2589
- _globals["_DATATYPE_YEARMONTHINTERVAL"]._serialized_end = 2768
- _globals["_DATATYPE_DAYTIMEINTERVAL"]._serialized_start = 2771
- _globals["_DATATYPE_DAYTIMEINTERVAL"]._serialized_end = 2948
- _globals["_DATATYPE_CHAR"]._serialized_start = 2950
- _globals["_DATATYPE_CHAR"]._serialized_end = 3038
- _globals["_DATATYPE_VARCHAR"]._serialized_start = 3040
- _globals["_DATATYPE_VARCHAR"]._serialized_end = 3131
- _globals["_DATATYPE_DECIMAL"]._serialized_start = 3134
- _globals["_DATATYPE_DECIMAL"]._serialized_end = 3287
- _globals["_DATATYPE_STRUCTFIELD"]._serialized_start = 3290
- _globals["_DATATYPE_STRUCTFIELD"]._serialized_end = 3451
- _globals["_DATATYPE_STRUCT"]._serialized_start = 3453
- _globals["_DATATYPE_STRUCT"]._serialized_end = 3580
- _globals["_DATATYPE_ARRAY"]._serialized_start = 3583
- _globals["_DATATYPE_ARRAY"]._serialized_end = 3745
- _globals["_DATATYPE_MAP"]._serialized_start = 3748
- _globals["_DATATYPE_MAP"]._serialized_end = 3967
- _globals["_DATATYPE_VARIANT"]._serialized_start = 3969
- _globals["_DATATYPE_VARIANT"]._serialized_end = 4036
- _globals["_DATATYPE_UDT"]._serialized_start = 4039
- _globals["_DATATYPE_UDT"]._serialized_end = 4328
- _globals["_DATATYPE_UNPARSED"]._serialized_start = 4330
- _globals["_DATATYPE_UNPARSED"]._serialized_end = 4382
+ _globals["_DATATYPE"]._serialized_end = 4569
+ _globals["_DATATYPE_BOOLEAN"]._serialized_start = 1647
+ _globals["_DATATYPE_BOOLEAN"]._serialized_end = 1714
+ _globals["_DATATYPE_BYTE"]._serialized_start = 1716
+ _globals["_DATATYPE_BYTE"]._serialized_end = 1780
+ _globals["_DATATYPE_SHORT"]._serialized_start = 1782
+ _globals["_DATATYPE_SHORT"]._serialized_end = 1847
+ _globals["_DATATYPE_INTEGER"]._serialized_start = 1849
+ _globals["_DATATYPE_INTEGER"]._serialized_end = 1916
+ _globals["_DATATYPE_LONG"]._serialized_start = 1918
+ _globals["_DATATYPE_LONG"]._serialized_end = 1982
+ _globals["_DATATYPE_FLOAT"]._serialized_start = 1984
+ _globals["_DATATYPE_FLOAT"]._serialized_end = 2049
+ _globals["_DATATYPE_DOUBLE"]._serialized_start = 2051
+ _globals["_DATATYPE_DOUBLE"]._serialized_end = 2117
+ _globals["_DATATYPE_STRING"]._serialized_start = 2119
+ _globals["_DATATYPE_STRING"]._serialized_end = 2215
+ _globals["_DATATYPE_BINARY"]._serialized_start = 2217
+ _globals["_DATATYPE_BINARY"]._serialized_end = 2283
+ _globals["_DATATYPE_NULL"]._serialized_start = 2285
+ _globals["_DATATYPE_NULL"]._serialized_end = 2349
+ _globals["_DATATYPE_TIMESTAMP"]._serialized_start = 2351
+ _globals["_DATATYPE_TIMESTAMP"]._serialized_end = 2420
+ _globals["_DATATYPE_DATE"]._serialized_start = 2422
+ _globals["_DATATYPE_DATE"]._serialized_end = 2486
+ _globals["_DATATYPE_TIMESTAMPNTZ"]._serialized_start = 2488
+ _globals["_DATATYPE_TIMESTAMPNTZ"]._serialized_end = 2560
+ _globals["_DATATYPE_TIME"]._serialized_start = 2562
+ _globals["_DATATYPE_TIME"]._serialized_end = 2675
+ _globals["_DATATYPE_CALENDARINTERVAL"]._serialized_start = 2677
+ _globals["_DATATYPE_CALENDARINTERVAL"]._serialized_end = 2753
+ _globals["_DATATYPE_YEARMONTHINTERVAL"]._serialized_start = 2756
+ _globals["_DATATYPE_YEARMONTHINTERVAL"]._serialized_end = 2935
+ _globals["_DATATYPE_DAYTIMEINTERVAL"]._serialized_start = 2938
+ _globals["_DATATYPE_DAYTIMEINTERVAL"]._serialized_end = 3115
+ _globals["_DATATYPE_CHAR"]._serialized_start = 3117
+ _globals["_DATATYPE_CHAR"]._serialized_end = 3205
+ _globals["_DATATYPE_VARCHAR"]._serialized_start = 3207
+ _globals["_DATATYPE_VARCHAR"]._serialized_end = 3298
+ _globals["_DATATYPE_DECIMAL"]._serialized_start = 3301
+ _globals["_DATATYPE_DECIMAL"]._serialized_end = 3454
+ _globals["_DATATYPE_STRUCTFIELD"]._serialized_start = 3457
+ _globals["_DATATYPE_STRUCTFIELD"]._serialized_end = 3618
+ _globals["_DATATYPE_STRUCT"]._serialized_start = 3620
+ _globals["_DATATYPE_STRUCT"]._serialized_end = 3747
+ _globals["_DATATYPE_ARRAY"]._serialized_start = 3750
+ _globals["_DATATYPE_ARRAY"]._serialized_end = 3912
+ _globals["_DATATYPE_MAP"]._serialized_start = 3915
+ _globals["_DATATYPE_MAP"]._serialized_end = 4134
+ _globals["_DATATYPE_VARIANT"]._serialized_start = 4136
+ _globals["_DATATYPE_VARIANT"]._serialized_end = 4203
+ _globals["_DATATYPE_UDT"]._serialized_start = 4206
+ _globals["_DATATYPE_UDT"]._serialized_end = 4495
+ _globals["_DATATYPE_UNPARSED"]._serialized_start = 4497
+ _globals["_DATATYPE_UNPARSED"]._serialized_end = 4549
# @@protoc_insertion_point(module_scope)
diff --git a/python/pyspark/sql/connect/proto/types_pb2.pyi b/python/pyspark/sql/connect/proto/types_pb2.pyi
index fcf35b8c1f196..d46770c4f888e 100644
--- a/python/pyspark/sql/connect/proto/types_pb2.pyi
+++ b/python/pyspark/sql/connect/proto/types_pb2.pyi
@@ -279,6 +279,40 @@ class DataType(google.protobuf.message.Message):
],
) -> None: ...
+ class Time(google.protobuf.message.Message):
+ DESCRIPTOR: google.protobuf.descriptor.Descriptor
+
+ PRECISION_FIELD_NUMBER: builtins.int
+ TYPE_VARIATION_REFERENCE_FIELD_NUMBER: builtins.int
+ precision: builtins.int
+ type_variation_reference: builtins.int
+ def __init__(
+ self,
+ *,
+ precision: builtins.int | None = ...,
+ type_variation_reference: builtins.int = ...,
+ ) -> None: ...
+ def HasField(
+ self,
+ field_name: typing_extensions.Literal[
+ "_precision", b"_precision", "precision", b"precision"
+ ],
+ ) -> builtins.bool: ...
+ def ClearField(
+ self,
+ field_name: typing_extensions.Literal[
+ "_precision",
+ b"_precision",
+ "precision",
+ b"precision",
+ "type_variation_reference",
+ b"type_variation_reference",
+ ],
+ ) -> None: ...
+ def WhichOneof(
+ self, oneof_group: typing_extensions.Literal["_precision", b"_precision"]
+ ) -> typing_extensions.Literal["precision"] | None: ...
+
class CalendarInterval(google.protobuf.message.Message):
DESCRIPTOR: google.protobuf.descriptor.Descriptor
@@ -788,6 +822,7 @@ class DataType(google.protobuf.message.Message):
VARIANT_FIELD_NUMBER: builtins.int
UDT_FIELD_NUMBER: builtins.int
UNPARSED_FIELD_NUMBER: builtins.int
+ TIME_FIELD_NUMBER: builtins.int
@property
def null(self) -> global___DataType.NULL: ...
@property
@@ -845,6 +880,8 @@ class DataType(google.protobuf.message.Message):
@property
def unparsed(self) -> global___DataType.Unparsed:
"""UnparsedDataType"""
+ @property
+ def time(self) -> global___DataType.Time: ...
def __init__(
self,
*,
@@ -873,6 +910,7 @@ class DataType(google.protobuf.message.Message):
variant: global___DataType.Variant | None = ...,
udt: global___DataType.UDT | None = ...,
unparsed: global___DataType.Unparsed | None = ...,
+ time: global___DataType.Time | None = ...,
) -> None: ...
def HasField(
self,
@@ -915,6 +953,8 @@ class DataType(google.protobuf.message.Message):
b"string",
"struct",
b"struct",
+ "time",
+ b"time",
"timestamp",
b"timestamp",
"timestamp_ntz",
@@ -972,6 +1012,8 @@ class DataType(google.protobuf.message.Message):
b"string",
"struct",
b"struct",
+ "time",
+ b"time",
"timestamp",
b"timestamp",
"timestamp_ntz",
@@ -1017,6 +1059,7 @@ class DataType(google.protobuf.message.Message):
"variant",
"udt",
"unparsed",
+ "time",
]
| None
): ...
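
The regenerated stub above exposes the new DataType.Time message with an optional precision field inside the existing "kind" oneof. As a quick sanity sketch of how the generated message behaves once this patch's types_pb2 module is importable (the precision value 6 is arbitrary):

from pyspark.sql.connect.proto import types_pb2 as pb2

dt = pb2.DataType(time=pb2.DataType.Time(precision=6))
assert dt.WhichOneof("kind") == "time"
assert dt.time.HasField("precision") and dt.time.precision == 6

# Leaving the optional field unset keeps it absent rather than zero-valued.
assert not pb2.DataType.Time().HasField("precision")
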
diff --git a/python/pyspark/sql/connect/session.py b/python/pyspark/sql/connect/session.py
index 303b9c9aac127..6ccffc718d064 100644
--- a/python/pyspark/sql/connect/session.py
+++ b/python/pyspark/sql/connect/session.py
@@ -23,7 +23,7 @@
import threading
import os
import warnings
-from collections.abc import Sized
+from collections.abc import Callable, Sized
import functools
from threading import RLock
from typing import (
@@ -106,6 +106,7 @@
)
if TYPE_CHECKING:
+ import pyspark.sql.connect.proto as pb2
from pyspark.sql.connect._typing import OptionalPrimitiveType
from pyspark.sql.connect.catalog import Catalog
from pyspark.sql.connect.udf import UDFRegistration
@@ -130,6 +131,7 @@ class Builder:
def __init__(self) -> None:
self._options: Dict[str, Any] = {}
self._channel_builder: Optional[DefaultChannelBuilder] = None
+ self._hook_factories: list["Callable[[SparkSession], SparkSession.Hook]"] = []
@overload
def config(self, key: str, value: Any) -> "SparkSession.Builder":
@@ -191,6 +193,13 @@ class CustomChannelBuilder(ChannelBuilder):
self._channel_builder = channelBuilder
return self
+ def _registerHook(
+ self, hook_factory: "Callable[[SparkSession], SparkSession.Hook]"
+ ) -> "SparkSession.Builder":
+ with self._lock:
+ self._hook_factories.append(hook_factory)
+ return self
+
def enableHiveSupport(self) -> "SparkSession.Builder":
raise PySparkNotImplementedError(
errorClass="NOT_IMPLEMENTED", messageParameters={"feature": "enableHiveSupport"}
@@ -235,11 +244,13 @@ def create(self) -> "SparkSession":
if has_channel_builder:
assert self._channel_builder is not None
- session = SparkSession(connection=self._channel_builder)
+ session = SparkSession(
+ connection=self._channel_builder, hook_factories=self._hook_factories
+ )
else:
spark_remote = to_str(self._options.get("spark.remote"))
assert spark_remote is not None
- session = SparkSession(connection=spark_remote)
+ session = SparkSession(connection=spark_remote, hook_factories=self._hook_factories)
SparkSession._set_default_and_active_session(session)
self._apply_options(session)
@@ -255,6 +266,16 @@ def getOrCreate(self) -> "SparkSession":
self._apply_options(session)
return session
+ class Hook:
+ """A Hook can be used to inject behavior into the session."""
+
+ def on_execute_plan(self, request: "pb2.ExecutePlanRequest") -> "pb2.ExecutePlanRequest":
+ """Called before sending an ExecutePlanRequest.
+
+ The request is replaced with the one returned by this method.
+ """
+ return request
+
_client: SparkConnectClient
# SPARK-47544: Explicitly declaring this as an identifier instead of a method.
@@ -262,7 +283,12 @@ def getOrCreate(self) -> "SparkSession":
builder: Builder = classproperty(lambda cls: cls.Builder()) # type: ignore
builder.__doc__ = PySparkSession.builder.__doc__
- def __init__(self, connection: Union[str, DefaultChannelBuilder], userId: Optional[str] = None):
+ def __init__(
+ self,
+ connection: Union[str, DefaultChannelBuilder],
+ userId: Optional[str] = None,
+ hook_factories: Optional[list["Callable[[SparkSession], Hook]"]] = None,
+ ) -> None:
"""
Creates a new SparkSession for the Spark Connect interface.
@@ -277,8 +303,15 @@ def __init__(self, connection: Union[str, DefaultChannelBuilder], userId: Option
isolate their Spark Sessions. If the `user_id` is not set, will default to
the $USER environment. Defining the user ID as part of the connection string
takes precedence.
+ hook_factories: list[Callable[[SparkSession], Hook]], optional
+ Optional list of factories for hooks to register with this session.
"""
- self._client = SparkConnectClient(connection=connection, user_id=userId)
+ hook_factories = hook_factories or []
+ self._client = SparkConnectClient(
+ connection=connection,
+ user_id=userId,
+ session_hooks=[factory(self) for factory in hook_factories],
+ )
self._session_id = self._client._session_id
# Set to false to prevent client.release_session on close() (testing only)
@@ -586,7 +619,7 @@ def createDataFrame(
safecheck = configs["spark.sql.execution.pandas.convertToArrowArraySafely"]
- ser = ArrowStreamPandasSerializer(cast(str, timezone), safecheck == "true")
+ ser = ArrowStreamPandasSerializer(cast(str, timezone), safecheck == "true", False)
_table = pa.Table.from_batches(
[
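
The session.py changes above add a small hook mechanism: Builder._registerHook collects factories, each new SparkSession turns them into Hook instances, and the client calls on_execute_plan before sending each ExecutePlanRequest. Below is a minimal sketch of how it could be used, based only on the API in this hunk; RequestCounter and the connection string are illustrative and not part of the patch:

import pyspark.sql.connect.proto as pb2
from pyspark.sql.connect.session import SparkSession


class RequestCounter(SparkSession.Hook):
    """Counts the ExecutePlanRequests sent by the session it is attached to."""

    def __init__(self, session: SparkSession) -> None:
        self._session = session
        self.count = 0

    def on_execute_plan(self, request: "pb2.ExecutePlanRequest") -> "pb2.ExecutePlanRequest":
        # The client sends whatever this method returns, so the request could
        # also be annotated or rewritten here; this sketch only counts it.
        self.count += 1
        return request


# The factory receives the newly created session and returns the hook.
spark = (
    SparkSession.builder.config("spark.remote", "sc://localhost")
    ._registerHook(RequestCounter)
    .create()
)
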
diff --git a/python/pyspark/sql/connect/tvf.py b/python/pyspark/sql/connect/tvf.py
index cf94fdb64915f..59a4e4fbe344e 100644
--- a/python/pyspark/sql/connect/tvf.py
+++ b/python/pyspark/sql/connect/tvf.py
@@ -127,7 +127,7 @@ def _test() -> None:
print("Not supported in no-GIL mode", file=sys.stderr)
sys.exit(0)
- from pyspark.testing import should_test_connect
+ from pyspark.testing.utils import should_test_connect
if not should_test_connect:
print("Skipping pyspark.sql.connect.tvf doctests", file=sys.stderr)
diff --git a/python/pyspark/sql/connect/types.py b/python/pyspark/sql/connect/types.py
index c2eb5f4e017f0..8f9e7c0561cc0 100644
--- a/python/pyspark/sql/connect/types.py
+++ b/python/pyspark/sql/connect/types.py
@@ -29,6 +29,7 @@
IntegerType,
FloatType,
DateType,
+ TimeType,
TimestampType,
TimestampNTZType,
DayTimeIntervalType,
@@ -128,6 +129,10 @@ def pyspark_types_to_proto_types(data_type: DataType) -> pb2.DataType:
ret = pb2.DataType()
if isinstance(data_type, NullType):
ret.null.CopyFrom(pb2.DataType.NULL())
+ elif isinstance(data_type, CharType):
+ ret.char.length = data_type.length
+ elif isinstance(data_type, VarcharType):
+ ret.var_char.length = data_type.length
elif isinstance(data_type, StringType):
ret.string.collation = data_type.collation
elif isinstance(data_type, BooleanType):
@@ -151,6 +156,8 @@ def pyspark_types_to_proto_types(data_type: DataType) -> pb2.DataType:
ret.decimal.precision = data_type.precision
elif isinstance(data_type, DateType):
ret.date.CopyFrom(pb2.DataType.Date())
+ elif isinstance(data_type, TimeType):
+ ret.time.precision = data_type.precision
elif isinstance(data_type, TimestampType):
ret.timestamp.CopyFrom(pb2.DataType.Timestamp())
elif isinstance(data_type, TimestampNTZType):
@@ -237,6 +244,8 @@ def proto_schema_to_pyspark_data_type(schema: pb2.DataType) -> DataType:
return VarcharType(schema.var_char.length)
elif schema.HasField("date"):
return DateType()
+ elif schema.HasField("time"):
+ return TimeType(schema.time.precision) if schema.time.HasField("precision") else TimeType()
elif schema.HasField("timestamp"):
return TimestampType()
elif schema.HasField("timestamp_ntz"):
diff --git a/python/pyspark/sql/connect/udf.py b/python/pyspark/sql/connect/udf.py
index 7009a51695c5d..0f45690a9db33 100644
--- a/python/pyspark/sql/connect/udf.py
+++ b/python/pyspark/sql/connect/udf.py
@@ -162,7 +162,6 @@ def __init__(
def returnType(self) -> DataType:
# Make sure this is called after Connect Session is initialized.
# ``_parse_datatype_string`` accesses to Connect Server for parsing a DDL formatted string.
- # TODO: PythonEvalType.SQL_BATCHED_UDF
if self._returnType_placeholder is None:
if isinstance(self._returnType, DataType):
self._returnType_placeholder = self._returnType
@@ -280,13 +279,15 @@ def register(
PythonEvalType.SQL_SCALAR_PANDAS_ITER_UDF,
PythonEvalType.SQL_SCALAR_ARROW_ITER_UDF,
PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF,
+ PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF,
]:
raise PySparkTypeError(
errorClass="INVALID_UDF_EVAL_TYPE",
messageParameters={
"eval_type": "SQL_BATCHED_UDF, SQL_ARROW_BATCHED_UDF, "
- "SQL_SCALAR_PANDAS_UDF, SQL_SCALAR_PANDAS_ITER_UDF or "
- "SQL_GROUPED_AGG_PANDAS_UDF"
+ "SQL_SCALAR_PANDAS_UDF, SQL_SCALAR_ARROW_UDF, "
+ "SQL_SCALAR_PANDAS_ITER_UDF, SQL_SCALAR_ARROW_ITER_UDF, "
+ "SQL_GROUPED_AGG_PANDAS_UDF or SQL_GROUPED_AGG_ARROW_UDF"
},
)
self.sparkSession._client.register_udf(
diff --git a/python/pyspark/sql/connect/udtf.py b/python/pyspark/sql/connect/udtf.py
index ed9ab26788f77..f049932071674 100644
--- a/python/pyspark/sql/connect/udtf.py
+++ b/python/pyspark/sql/connect/udtf.py
@@ -22,7 +22,7 @@
check_dependencies(__name__)
import warnings
-from typing import List, Type, TYPE_CHECKING, Optional, Union
+from typing import List, Type, TYPE_CHECKING, Optional, Union, Any
from pyspark.util import PythonEvalType
from pyspark.sql.connect.column import Column
@@ -34,10 +34,11 @@
from pyspark.sql.connect.table_arg import TableArg
from pyspark.sql.connect.types import UnparsedDataType
from pyspark.sql.connect.utils import get_python_ver
+from pyspark.sql.pandas.utils import require_minimum_pyarrow_version, require_minimum_pandas_version
from pyspark.sql.udtf import AnalyzeArgument, AnalyzeResult # noqa: F401
from pyspark.sql.udtf import UDTFRegistration as PySparkUDTFRegistration, _validate_udtf_handler
from pyspark.sql.types import DataType, StructType
-from pyspark.errors import PySparkRuntimeError, PySparkTypeError
+from pyspark.errors import PySparkRuntimeError, PySparkTypeError, PySparkAttributeError
if TYPE_CHECKING:
@@ -87,11 +88,6 @@ def _create_py_udtf(
eval_type: int = PythonEvalType.SQL_TABLE_UDF
if arrow_enabled:
- from pyspark.sql.pandas.utils import (
- require_minimum_pandas_version,
- require_minimum_pyarrow_version,
- )
-
try:
require_minimum_pandas_version()
require_minimum_pyarrow_version()
@@ -106,6 +102,43 @@ def _create_py_udtf(
return _create_udtf(cls, returnType, name, eval_type, deterministic)
+def _create_pyarrow_udtf(
+ cls: Type,
+ returnType: Optional[Union[StructType, str]],
+ name: Optional[str] = None,
+ deterministic: bool = False,
+) -> "UserDefinedTableFunction":
+ """Create a PyArrow-native Python UDTF."""
+ # Validate PyArrow dependencies
+ require_minimum_pyarrow_version()
+
+ # Validate the handler class with PyArrow-specific checks
+ _validate_arrow_udtf_handler(cls, returnType)
+
+ return _create_udtf(
+ cls=cls,
+ returnType=returnType,
+ name=name,
+ evalType=PythonEvalType.SQL_ARROW_UDTF,
+ deterministic=deterministic,
+ )
+
+
+def _validate_arrow_udtf_handler(cls: Any, returnType: Optional[Union[StructType, str]]) -> None:
+ """Validate the handler class of a PyArrow UDTF."""
+ # First run standard UDTF validation
+ _validate_udtf_handler(cls, returnType)
+
+ # Block analyze method usage in arrow UDTFs
+ # TODO(SPARK-53286): Support analyze method for Arrow UDTFs to enable dynamic return types
+ has_analyze = hasattr(cls, "analyze")
+ if has_analyze:
+ raise PySparkAttributeError(
+ errorClass="INVALID_ARROW_UDTF_WITH_ANALYZE",
+ messageParameters={"name": cls.__name__},
+ )
+
+
class UserDefinedTableFunction:
"""
User defined function in Python
@@ -203,12 +236,16 @@ def register(
},
)
- if f.evalType not in [PythonEvalType.SQL_TABLE_UDF, PythonEvalType.SQL_ARROW_TABLE_UDF]:
+ if f.evalType not in [
+ PythonEvalType.SQL_TABLE_UDF,
+ PythonEvalType.SQL_ARROW_TABLE_UDF,
+ PythonEvalType.SQL_ARROW_UDTF,
+ ]:
raise PySparkTypeError(
errorClass="INVALID_UDTF_EVAL_TYPE",
messageParameters={
"name": name,
- "eval_type": "SQL_TABLE_UDF, SQL_ARROW_TABLE_UDF",
+ "eval_type": "SQL_TABLE_UDF, SQL_ARROW_TABLE_UDF, SQL_ARROW_UDTF",
},
)
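
The udtf.py additions above give Arrow UDTFs their own creation path and reject handlers that define analyze, since dynamic return types are not supported yet (see the SPARK-53286 TODO). A short sketch of that validation behavior; the handler classes are illustrative:

from pyspark.errors import PySparkAttributeError
from pyspark.sql.connect.udtf import _validate_arrow_udtf_handler


class PlainHandler:
    def eval(self, x: int):
        yield (x,)


class HandlerWithAnalyze(PlainHandler):
    @staticmethod
    def analyze(*args):
        raise NotImplementedError


# A handler with an explicit return type and no `analyze` passes validation.
_validate_arrow_udtf_handler(PlainHandler, returnType="x int")

# Defining `analyze` trips the Arrow-specific check added in this hunk.
try:
    _validate_arrow_udtf_handler(HandlerWithAnalyze, returnType=None)
except PySparkAttributeError as exc:
    print(exc)  # INVALID_ARROW_UDTF_WITH_ANALYZE
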
diff --git a/python/pyspark/sql/conversion.py b/python/pyspark/sql/conversion.py
index a0cd89da38224..f1aa55c2039ac 100644
--- a/python/pyspark/sql/conversion.py
+++ b/python/pyspark/sql/conversion.py
@@ -18,7 +18,7 @@
import array
import datetime
import decimal
-from typing import TYPE_CHECKING, Any, Callable, List, Sequence
+from typing import TYPE_CHECKING, Any, Callable, List, Optional, Sequence, Union, overload
from pyspark.errors import PySparkValueError
from pyspark.sql.pandas.types import _dedup_names, _deduplicate_field_names, to_arrow_schema
@@ -91,16 +91,40 @@ def _need_converter(
else:
return False
+ @overload
+ @staticmethod
+ def _create_converter(
+ dataType: DataType, nullable: bool = True, *, int_to_decimal_coercion_enabled: bool = False
+ ) -> Callable:
+ pass
+
+ @overload
@staticmethod
def _create_converter(
dataType: DataType,
nullable: bool = True,
- ) -> Callable:
+ *,
+ none_on_identity: bool = True,
+ int_to_decimal_coercion_enabled: bool = False,
+ ) -> Optional[Callable]:
+ pass
+
+ @staticmethod
+ def _create_converter(
+ dataType: DataType,
+ nullable: bool = True,
+ *,
+ none_on_identity: bool = False,
+ int_to_decimal_coercion_enabled: bool = False,
+ ) -> Optional[Callable]:
assert dataType is not None and isinstance(dataType, DataType)
assert isinstance(nullable, bool)
if not LocalDataToArrowConversion._need_converter(dataType, nullable):
- return lambda value: value
+ if none_on_identity:
+ return None
+ else:
+ return lambda value: value
if isinstance(dataType, NullType):
@@ -113,10 +137,16 @@ def convert_null(value: Any) -> Any:
elif isinstance(dataType, StructType):
field_names = dataType.fieldNames()
+ len_field_names = len(field_names)
dedup_field_names = _dedup_names(dataType.names)
field_convs = [
- LocalDataToArrowConversion._create_converter(field.dataType, field.nullable)
+ LocalDataToArrowConversion._create_converter(
+ field.dataType,
+ field.nullable,
+ none_on_identity=True,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
+ )
for field in dataType.fields
]
@@ -126,71 +156,113 @@ def convert_struct(value: Any) -> Any:
raise PySparkValueError(f"input for {dataType} must not be None")
return None
else:
- assert isinstance(value, (tuple, dict)) or hasattr(
- value, "__dict__"
- ), f"{type(value)} {value}"
-
- _dict = {}
- if (
- not isinstance(value, Row)
- and not isinstance(value, tuple) # inherited namedtuple
- and hasattr(value, "__dict__")
- ):
- value = value.__dict__
- if isinstance(value, dict):
- for i, field in enumerate(field_names):
- _dict[dedup_field_names[i]] = field_convs[i](value.get(field))
- else:
- if len(value) != len(field_names):
+ # The `value` should be a tuple, a dict, or an object with `__dict__`.
+ if isinstance(value, tuple): # `Row` inherits `tuple`
+ if len(value) != len_field_names:
raise PySparkValueError(
errorClass="AXIS_LENGTH_MISMATCH",
messageParameters={
- "expected_length": str(len(field_names)),
+ "expected_length": str(len_field_names),
"actual_length": str(len(value)),
},
)
- for i in range(len(field_names)):
- _dict[dedup_field_names[i]] = field_convs[i](value[i])
-
- return _dict
+ return {
+ dedup_field_names[i]: (
+ field_convs[i](value[i]) # type: ignore[misc]
+ if field_convs[i] is not None
+ else value[i]
+ )
+ for i in range(len_field_names)
+ }
+ elif isinstance(value, dict):
+ return {
+ dedup_field_names[i]: (
+ field_convs[i](value.get(field)) # type: ignore[misc]
+ if field_convs[i] is not None
+ else value.get(field)
+ )
+ for i, field in enumerate(field_names)
+ }
+ else:
+ assert hasattr(value, "__dict__"), f"{type(value)} {value}"
+ value = value.__dict__
+ return {
+ dedup_field_names[i]: (
+ field_convs[i](value.get(field)) # type: ignore[misc]
+ if field_convs[i] is not None
+ else value.get(field)
+ )
+ for i, field in enumerate(field_names)
+ }
return convert_struct
elif isinstance(dataType, ArrayType):
element_conv = LocalDataToArrowConversion._create_converter(
- dataType.elementType, dataType.containsNull
+ dataType.elementType,
+ dataType.containsNull,
+ none_on_identity=True,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
)
- def convert_array(value: Any) -> Any:
- if value is None:
- if not nullable:
- raise PySparkValueError(f"input for {dataType} must not be None")
- return None
- else:
- assert isinstance(value, (list, array.array))
- return [element_conv(v) for v in value]
+ if element_conv is None:
+
+ def convert_array(value: Any) -> Any:
+ if value is None:
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ else:
+ assert isinstance(value, (list, array.array))
+ return list(value)
+
+ else:
+
+ def convert_array(value: Any) -> Any:
+ if value is None:
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ else:
+ assert isinstance(value, (list, array.array))
+ return [element_conv(v) for v in value]
return convert_array
elif isinstance(dataType, MapType):
- key_conv = LocalDataToArrowConversion._create_converter(dataType.keyType)
+ key_conv = LocalDataToArrowConversion._create_converter(
+ dataType.keyType,
+ nullable=False,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
+ )
value_conv = LocalDataToArrowConversion._create_converter(
- dataType.valueType, dataType.valueContainsNull
+ dataType.valueType,
+ dataType.valueContainsNull,
+ none_on_identity=True,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
)
- def convert_map(value: Any) -> Any:
- if value is None:
- if not nullable:
- raise PySparkValueError(f"input for {dataType} must not be None")
- return None
- else:
- assert isinstance(value, dict)
+ if value_conv is None:
- _tuples = []
- for k, v in value.items():
- _tuples.append((key_conv(k), value_conv(v)))
+ def convert_map(value: Any) -> Any:
+ if value is None:
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ else:
+ assert isinstance(value, dict)
+ return [(key_conv(k), v) for k, v in value.items()]
+
+ else:
- return _tuples
+ def convert_map(value: Any) -> Any:
+ if value is None:
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ else:
+ assert isinstance(value, dict)
+ return [(key_conv(k), value_conv(v)) for k, v in value.items()]
return convert_map
@@ -241,8 +313,15 @@ def convert_decimal(value: Any) -> Any:
raise PySparkValueError(f"input for {dataType} must not be None")
return None
else:
+ if int_to_decimal_coercion_enabled and isinstance(value, int):
+ value = decimal.Decimal(value)
+
assert isinstance(value, decimal.Decimal)
- return None if value.is_nan() else value
+ if value.is_nan():
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ return value
return convert_decimal
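For reference, a minimal standalone sketch of the int-to-Decimal coercion guarded by `int_to_decimal_coercion_enabled` in the hunk above (standard library only, no Spark needed; names are illustrative):

import decimal

def coerce_to_decimal(value, int_to_decimal_coercion_enabled: bool) -> decimal.Decimal:
    # Mirrors the branch above: plain ints are promoted to Decimal before the type check.
    if int_to_decimal_coercion_enabled and isinstance(value, int):
        value = decimal.Decimal(value)
    assert isinstance(value, decimal.Decimal), f"{type(value)} {value}"
    return value

print(coerce_to_decimal(7, True))                        # Decimal('7')
print(coerce_to_decimal(decimal.Decimal("1.5"), False))  # 1.5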
@@ -255,7 +334,7 @@ def convert_string(value: Any) -> Any:
return None
else:
if isinstance(value, bool):
- # To match the PySpark which convert bool to string in
+ # To match PySpark Classic, which converts bool to string in
# the JVM side (python.EvaluatePython.makeFromJava)
return str(value).lower()
else:
@@ -266,15 +345,32 @@ def convert_string(value: Any) -> Any:
elif isinstance(dataType, UserDefinedType):
udt: UserDefinedType = dataType
- conv = LocalDataToArrowConversion._create_converter(udt.sqlType())
+ conv = LocalDataToArrowConversion._create_converter(
+ udt.sqlType(),
+ nullable=nullable,
+ none_on_identity=True,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
+ )
- def convert_udt(value: Any) -> Any:
- if value is None:
- if not nullable:
- raise PySparkValueError(f"input for {dataType} must not be None")
- return None
- else:
- return conv(udt.serialize(value))
+ if conv is None:
+
+ def convert_udt(value: Any) -> Any:
+ if value is None:
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ else:
+ return udt.serialize(value)
+
+ else:
+
+ def convert_udt(value: Any) -> Any:
+ if value is None:
+ if not nullable:
+ raise PySparkValueError(f"input for {dataType} must not be None")
+ return None
+ else:
+ return conv(udt.serialize(value))
return convert_udt
@@ -301,7 +397,10 @@ def convert_other(value: Any) -> Any:
return convert_other
else:
- return lambda value: value
+ if none_on_identity:
+ return None
+ else:
+ return lambda value: value
@staticmethod
def convert(data: Sequence[Any], schema: StructType, use_large_var_types: bool) -> "pa.Table":
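As background for the converter changes above: with `none_on_identity=True`, `_create_converter` now returns `None` instead of an identity lambda, and callers branch once while building nested converters rather than paying a function call per value. A minimal standalone sketch of that pattern (names are illustrative, no Spark required):

from typing import Callable, List, Optional

def make_converter(needs_work: bool) -> Optional[Callable[[int], int]]:
    # Return None when values can pass through unchanged (the "none_on_identity" case).
    return (lambda v: v + 1) if needs_work else None

def convert_column(values: List[int], conv: Optional[Callable[[int], int]]) -> List[int]:
    # Branch once per column instead of once per value.
    return [conv(v) for v in values] if conv is not None else list(values)

print(convert_column([1, 2, 3], make_converter(True)))   # [2, 3, 4]
print(convert_column([1, 2, 3], make_converter(False)))  # [1, 2, 3]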
@@ -313,55 +412,73 @@ def convert(data: Sequence[Any], schema: StructType, use_large_var_types: bool)
assert schema is not None and isinstance(schema, StructType)
column_names = schema.fieldNames()
+ len_column_names = len(column_names)
- column_convs = [
- LocalDataToArrowConversion._create_converter(field.dataType, field.nullable)
- for field in schema.fields
- ]
-
- pylist: List[List] = [[] for _ in range(len(column_names))]
-
- for item in data:
- if isinstance(item, VariantVal):
+ def to_row(item: Any) -> tuple:
+ if item is None:
+ return tuple([None] * len_column_names)
+ elif isinstance(item, tuple): # `Row` inherits `tuple`
+ if len(item) != len_column_names:
+ raise PySparkValueError(
+ errorClass="AXIS_LENGTH_MISMATCH",
+ messageParameters={
+ "expected_length": str(len_column_names),
+ "actual_length": str(len(item)),
+ },
+ )
+ return tuple(item)
+ elif isinstance(item, dict):
+ return tuple([item.get(col) for col in column_names])
+ elif isinstance(item, VariantVal):
raise PySparkValueError("Rows cannot be of type VariantVal")
- if (
- not isinstance(item, Row)
- and not isinstance(item, tuple) # inherited namedtuple
- and hasattr(item, "__dict__")
- ):
+ elif hasattr(item, "__dict__"):
item = item.__dict__
- if isinstance(item, dict):
- for i, col in enumerate(column_names):
- pylist[i].append(column_convs[i](item.get(col)))
- elif item is None:
- for i, col in enumerate(column_names):
- pylist[i].append(None)
+ return tuple([item.get(col) for col in column_names])
else:
- if len(item) != len(column_names):
+ if len(item) != len_column_names:
raise PySparkValueError(
errorClass="AXIS_LENGTH_MISMATCH",
messageParameters={
- "expected_length": str(len(column_names)),
+ "expected_length": str(len_column_names),
"actual_length": str(len(item)),
},
)
+ return tuple(item)
+
+ rows = [to_row(item) for item in data]
+
+ if len_column_names > 0:
+ column_convs = [
+ LocalDataToArrowConversion._create_converter(
+ field.dataType,
+ field.nullable,
+ none_on_identity=True,
+ # Default to False for general data conversion
+ int_to_decimal_coercion_enabled=False,
+ )
+ for field in schema.fields
+ ]
- for i in range(len(column_names)):
- pylist[i].append(column_convs[i](item[i]))
+ pylist = [
+ [conv(row[i]) for row in rows] if conv is not None else [row[i] for row in rows]
+ for i, conv in enumerate(column_convs)
+ ]
- pa_schema = to_arrow_schema(
- StructType(
- [
- StructField(
- field.name, _deduplicate_field_names(field.dataType), field.nullable
- )
- for field in schema.fields
- ]
- ),
- prefers_large_types=use_large_var_types,
- )
+ pa_schema = to_arrow_schema(
+ StructType(
+ [
+ StructField(
+ field.name, _deduplicate_field_names(field.dataType), field.nullable
+ )
+ for field in schema.fields
+ ]
+ ),
+ prefers_large_types=use_large_var_types,
+ )
- return pa.Table.from_arrays(pylist, schema=pa_schema)
+ return pa.Table.from_arrays(pylist, schema=pa_schema)
+ else:
+ return pa.Table.from_struct_array(pa.array([{}] * len(rows)))
class ArrowTableToRowsConversion:
@@ -393,12 +510,29 @@ def _need_converter(dataType: DataType) -> bool:
else:
return False
+ @overload
@staticmethod
def _create_converter(dataType: DataType) -> Callable:
+ pass
+
+ @overload
+ @staticmethod
+ def _create_converter(
+ dataType: DataType, *, none_on_identity: bool = True
+ ) -> Optional[Callable]:
+ pass
+
+ @staticmethod
+ def _create_converter(
+ dataType: DataType, *, none_on_identity: bool = False
+ ) -> Optional[Callable]:
assert dataType is not None and isinstance(dataType, DataType)
if not ArrowTableToRowsConversion._need_converter(dataType):
- return lambda value: value
+ if none_on_identity:
+ return None
+ else:
+ return lambda value: value
if isinstance(dataType, NullType):
return lambda value: None
@@ -408,7 +542,8 @@ def _create_converter(dataType: DataType) -> Callable:
dedup_field_names = _dedup_names(field_names)
field_convs = [
- ArrowTableToRowsConversion._create_converter(f.dataType) for f in dataType.fields
+ ArrowTableToRowsConversion._create_converter(f.dataType, none_on_identity=True)
+ for f in dataType.fields
]
def convert_struct(value: Any) -> Any:
@@ -418,7 +553,9 @@ def convert_struct(value: Any) -> Any:
assert isinstance(value, dict)
_values = [
- field_convs[i](value.get(name, None))
+ field_convs[i](value.get(name, None)) # type: ignore[misc]
+ if field_convs[i] is not None
+ else value.get(name, None)
for i, name in enumerate(dedup_field_names)
]
return _create_row(field_names, _values)
@@ -426,28 +563,79 @@ def convert_struct(value: Any) -> Any:
return convert_struct
elif isinstance(dataType, ArrayType):
- element_conv = ArrowTableToRowsConversion._create_converter(dataType.elementType)
+ element_conv = ArrowTableToRowsConversion._create_converter(
+ dataType.elementType, none_on_identity=True
+ )
- def convert_array(value: Any) -> Any:
- if value is None:
- return None
- else:
- assert isinstance(value, list)
- return [element_conv(v) for v in value]
+ if element_conv is None:
+
+ def convert_array(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ assert isinstance(value, list)
+ return value
+
+ else:
+
+ def convert_array(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ assert isinstance(value, list)
+ return [element_conv(v) for v in value]
return convert_array
elif isinstance(dataType, MapType):
- key_conv = ArrowTableToRowsConversion._create_converter(dataType.keyType)
- value_conv = ArrowTableToRowsConversion._create_converter(dataType.valueType)
+ key_conv = ArrowTableToRowsConversion._create_converter(
+ dataType.keyType, none_on_identity=True
+ )
+ value_conv = ArrowTableToRowsConversion._create_converter(
+ dataType.valueType, none_on_identity=True
+ )
+
+ if key_conv is None:
+ if value_conv is None:
+
+ def convert_map(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ assert isinstance(value, list)
+ assert all(isinstance(t, tuple) and len(t) == 2 for t in value)
+ return dict(value)
+
+ else:
+
+ def convert_map(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ assert isinstance(value, list)
+ assert all(isinstance(t, tuple) and len(t) == 2 for t in value)
+ return dict((t[0], value_conv(t[1])) for t in value)
+
+ else:
+ if value_conv is None:
+
+ def convert_map(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ assert isinstance(value, list)
+ assert all(isinstance(t, tuple) and len(t) == 2 for t in value)
+ return dict((key_conv(t[0]), t[1]) for t in value)
- def convert_map(value: Any) -> Any:
- if value is None:
- return None
else:
- assert isinstance(value, list)
- assert all(isinstance(t, tuple) and len(t) == 2 for t in value)
- return dict((key_conv(t[0]), value_conv(t[1])) for t in value)
+
+ def convert_map(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ assert isinstance(value, list)
+ assert all(isinstance(t, tuple) and len(t) == 2 for t in value)
+ return dict((key_conv(t[0]), value_conv(t[1])) for t in value)
return convert_map
@@ -487,13 +675,25 @@ def convert_timestample_ntz(value: Any) -> Any:
elif isinstance(dataType, UserDefinedType):
udt: UserDefinedType = dataType
- conv = ArrowTableToRowsConversion._create_converter(udt.sqlType())
+ conv = ArrowTableToRowsConversion._create_converter(
+ udt.sqlType(), none_on_identity=True
+ )
- def convert_udt(value: Any) -> Any:
- if value is None:
- return None
- else:
- return udt.deserialize(conv(value))
+ if conv is None:
+
+ def convert_udt(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ return udt.deserialize(value)
+
+ else:
+
+ def convert_udt(value: Any) -> Any:
+ if value is None:
+ return None
+ else:
+ return udt.deserialize(conv(value))
return convert_udt
@@ -514,10 +714,29 @@ def convert_variant(value: Any) -> Any:
return convert_variant
else:
- return lambda value: value
+ if none_on_identity:
+ return None
+ else:
+ return lambda value: value
+ @overload
@staticmethod
- def convert(table: "pa.Table", schema: StructType) -> List[Row]:
+ def convert( # type: ignore[overload-overlap]
+ table: "pa.Table", schema: StructType
+ ) -> List[Row]:
+ pass
+
+ @overload
+ @staticmethod
+ def convert(
+ table: "pa.Table", schema: StructType, *, return_as_tuples: bool = True
+ ) -> List[tuple]:
+ pass
+
+ @staticmethod # type: ignore[misc]
+ def convert(
+ table: "pa.Table", schema: StructType, *, return_as_tuples: bool = False
+ ) -> List[Union[Row, tuple]]:
require_minimum_pyarrow_version()
import pyarrow as pa
@@ -525,14 +744,27 @@ def convert(table: "pa.Table", schema: StructType) -> List[Row]:
assert schema is not None and isinstance(schema, StructType)
- field_converters = [
- ArrowTableToRowsConversion._create_converter(f.dataType) for f in schema.fields
- ]
+ fields = schema.fieldNames()
+
+ if len(fields) > 0:
+ field_converters = [
+ ArrowTableToRowsConversion._create_converter(f.dataType, none_on_identity=True)
+ for f in schema.fields
+ ]
- columnar_data = [column.to_pylist() for column in table.columns]
+ columnar_data = [
+ [conv(v) for v in column.to_pylist()] if conv is not None else column.to_pylist()
+ for column, conv in zip(table.columns, field_converters)
+ ]
- rows: List[Row] = []
- for i in range(0, table.num_rows):
- values = [field_converters[j](columnar_data[j][i]) for j in range(table.num_columns)]
- rows.append(_create_row(fields=schema.fieldNames(), values=values))
- return rows
+ if return_as_tuples:
+ rows = [tuple(cols) for cols in zip(*columnar_data)]
+ else:
+ rows = [_create_row(fields, tuple(cols)) for cols in zip(*columnar_data)]
+ assert len(rows) == table.num_rows, f"{len(rows)}, {table.num_rows}"
+ return rows
+ else:
+ if return_as_tuples:
+ return [tuple()] * table.num_rows
+ else:
+ return [_create_row(fields, tuple())] * table.num_rows
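The reworked `convert` paths above normalize every input item to a tuple, convert column by column (skipping columns whose converter is `None`), and only then zip the columns back into rows, or into plain tuples when `return_as_tuples=True`. A small standalone sketch of that columnar flow with illustrative data:

from typing import Callable, List, Optional

columns: List[List[int]] = [[1, 2, 3], [10, 20, 30]]
# One optional converter per column; None means "pass the column through unchanged".
convs: List[Optional[Callable[[int], int]]] = [None, lambda v: v * 2]

converted = [
    [conv(v) for v in col] if conv is not None else col
    for col, conv in zip(columns, convs)
]
rows = [tuple(vals) for vals in zip(*converted)]  # row view, as with return_as_tuples=True
print(rows)  # [(1, 20), (2, 40), (3, 60)]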
diff --git a/python/pyspark/sql/dataframe.py b/python/pyspark/sql/dataframe.py
index c00c3f484232b..675d972e3ef51 100644
--- a/python/pyspark/sql/dataframe.py
+++ b/python/pyspark/sql/dataframe.py
@@ -4182,7 +4182,10 @@ def unpivot(
| 2| 12| 1.2|
+---+---+------+
- >>> df.unpivot("id", ["int", "double"], "var", "val").show()
+ >>> from pyspark.sql import functions as sf
+ >>> df.unpivot(
+ ... "id", ["int", "double"], "var", "val"
+ ... ).sort("id", sf.desc("var")).show()
+---+------+----+
| id| var| val|
+---+------+----+
@@ -5234,7 +5237,7 @@ def replace(
|NULL| NULL|NULL|
+----+------+----+
- Example 4: Replace 10 to 20 in the 'name' column.
+ Example 4: Replace 10 with 18 in the 'age' column.
>>> df.na.replace(10, 18, 'age').show()
+----+------+-----+
diff --git a/python/pyspark/sql/datasource.py b/python/pyspark/sql/datasource.py
index c9704ff9f2599..f1908180a3ba5 100644
--- a/python/pyspark/sql/datasource.py
+++ b/python/pyspark/sql/datasource.py
@@ -43,13 +43,13 @@
"DataSource",
"DataSourceReader",
"DataSourceStreamReader",
- "SimpleDataSourceStreamReader",
"DataSourceWriter",
"DataSourceArrowWriter",
"DataSourceStreamWriter",
+ "DataSourceStreamArrowWriter",
+ "SimpleDataSourceStreamReader",
"DataSourceRegistration",
"InputPartition",
- "SimpleDataSourceStreamReader",
"WriterCommitMessage",
"Filter",
"EqualTo",
@@ -1098,6 +1098,59 @@ def abort(self, messages: List[Optional["WriterCommitMessage"]], batchId: int) -
...
+class DataSourceStreamArrowWriter(DataSourceStreamWriter):
+ """
+ A base class for data stream writers that process data using PyArrow's `RecordBatch`.
+
+ Unlike :class:`DataSourceStreamWriter`, which works with an iterator of Spark Rows, this class
+ is optimized for using the Arrow format when writing streaming data. It can offer better
+ performance when interfacing with systems or libraries that natively support Arrow for
+ streaming use cases.
+
+ .. versionadded:: 4.1.0
+ """
+
+ @abstractmethod
+ def write(self, iterator: Iterator["RecordBatch"]) -> "WriterCommitMessage":
+ """
+ Writes an iterator of PyArrow `RecordBatch` objects to the streaming sink.
+
+ This method is called on executors to write data to the streaming data sink in
+ each microbatch. It accepts an iterator of PyArrow `RecordBatch` objects and
+ returns a single commit message, or None if there is no commit message.
+
+ The driver collects commit messages, if any, from all executors and passes them
+ to the :class:`DataSourceStreamArrowWriter.commit` method if all tasks run
+ successfully. If any task fails, the :class:`DataSourceStreamArrowWriter.abort` method
+ will be called with the collected commit messages.
+
+ Parameters
+ ----------
+ iterator : iterator of :class:`RecordBatch`\\s
+ An iterator of PyArrow `RecordBatch` objects representing the input data.
+
+ Returns
+ -------
+ :class:`WriterCommitMessage`
+ a serializable commit message
+
+ Examples
+ --------
+ >>> from dataclasses import dataclass
+ >>> @dataclass
+ ... class MyCommitMessage(WriterCommitMessage):
+ ... num_rows: int
+ ... batch_id: int
+ ...
+ >>> def write(self, iterator: Iterator["RecordBatch"]) -> "WriterCommitMessage":
+ ... total_rows = 0
+ ... for batch in iterator:
+ ... total_rows += len(batch)
+ ... return MyCommitMessage(num_rows=total_rows, batch_id=self.current_batch_id)
+ """
+ ...
+
+
class WriterCommitMessage:
"""
A commit message returned by the :meth:`DataSourceWriter.write` and will be
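A hedged, minimal sketch of subclassing the new `DataSourceStreamArrowWriter`; the class and field names (`CountingArrowWriter`, `RowCount`) are illustrative, it assumes a build that includes this patch, and `commit`/`abort` follow the contract of the `DataSourceStreamWriter` base shown above:

from dataclasses import dataclass
from typing import Iterator, List, Optional

import pyarrow as pa
from pyspark.sql.datasource import DataSourceStreamArrowWriter, WriterCommitMessage

@dataclass
class RowCount(WriterCommitMessage):
    num_rows: int

class CountingArrowWriter(DataSourceStreamArrowWriter):
    def write(self, iterator: Iterator[pa.RecordBatch]) -> WriterCommitMessage:
        # Runs on executors for each microbatch partition; consumes Arrow batches directly.
        total = 0
        for batch in iterator:
            total += batch.num_rows
        return RowCount(num_rows=total)

    def commit(self, messages: List[Optional[WriterCommitMessage]], batchId: int) -> None:
        # Runs on the driver once all tasks of the microbatch succeed.
        print(batchId, sum(m.num_rows for m in messages if isinstance(m, RowCount)))

    def abort(self, messages: List[Optional[WriterCommitMessage]], batchId: int) -> None:
        print(f"microbatch {batchId} aborted")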
diff --git a/python/pyspark/sql/functions/__init__.py b/python/pyspark/sql/functions/__init__.py
index 8ab2ac377c2a8..0d1df20d13d6f 100644
--- a/python/pyspark/sql/functions/__init__.py
+++ b/python/pyspark/sql/functions/__init__.py
@@ -202,6 +202,7 @@
"convert_timezone",
"curdate",
"current_date",
+ "current_time",
"current_timestamp",
"current_timezone",
"date_add",
@@ -228,6 +229,7 @@
"make_date",
"make_dt_interval",
"make_interval",
+ "make_time",
"make_timestamp",
"make_timestamp_ltz",
"make_timestamp_ntz",
@@ -246,7 +248,9 @@
"timestamp_micros",
"timestamp_millis",
"timestamp_seconds",
+ "time_trunc",
"to_date",
+ "to_time",
"to_timestamp",
"to_timestamp_ltz",
"to_timestamp_ntz",
@@ -257,7 +261,9 @@
"try_make_timestamp",
"try_make_timestamp_ltz",
"try_make_timestamp_ntz",
+ "try_to_time",
"try_to_timestamp",
+ "try_to_date",
"unix_date",
"unix_micros",
"unix_millis",
@@ -498,6 +504,7 @@
# UDF, UDTF and UDT
"AnalyzeArgument",
"AnalyzeResult",
+ "ArrowUDFType",
"OrderingColumn",
"PandasUDFType",
"PartitioningColumn",
@@ -505,9 +512,11 @@
"SkipRestOfInputTableException",
"UserDefinedFunction",
"UserDefinedTableFunction",
+ "arrow_udf",
"call_udf",
"pandas_udf",
"udf",
"udtf",
+ "arrow_udtf",
"unwrap_udt",
]
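A hedged usage sketch touching several of the functions newly exported above (`current_time`, `make_time`, `time_trunc`); it assumes a running SparkSession on a build that includes these 4.1.0 additions, and the column names are illustrative:

from pyspark.sql import SparkSession, functions as sf

spark = SparkSession.builder.getOrCreate()
df = spark.createDataFrame([(6, 30, 45.887)], ["h", "m", "s"])
df.select(
    sf.current_time(3).alias("now"),                 # current time, millisecond precision
    sf.make_time("h", "m", "s").alias("t"),          # 06:30:45.887
    sf.time_trunc(sf.lit("MINUTE"), sf.make_time("h", "m", "s")).alias("t_min"),  # 06:30:00
).show(truncate=False)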
diff --git a/python/pyspark/sql/functions/builtin.py b/python/pyspark/sql/functions/builtin.py
index 37b65c3203da8..b09713e0c289e 100644
--- a/python/pyspark/sql/functions/builtin.py
+++ b/python/pyspark/sql/functions/builtin.py
@@ -57,10 +57,15 @@
from pyspark.sql.udtf import AnalyzeArgument, AnalyzeResult # noqa: F401
from pyspark.sql.udtf import OrderingColumn, PartitioningColumn, SelectedColumn # noqa: F401
from pyspark.sql.udtf import SkipRestOfInputTableException # noqa: F401
-from pyspark.sql.udtf import UserDefinedTableFunction, _create_py_udtf
+from pyspark.sql.udtf import UserDefinedTableFunction, _create_py_udtf, _create_pyarrow_udtf
# Keep pandas_udf and PandasUDFType import for backwards compatible import; moved in SPARK-28264
-from pyspark.sql.pandas.functions import pandas_udf, PandasUDFType # noqa: F401
+from pyspark.sql.pandas.functions import ( # noqa: F401
+ arrow_udf, # noqa: F401
+ pandas_udf, # noqa: F401
+ ArrowUDFType, # noqa: F401
+ PandasUDFType, # noqa: F401
+) # noqa: F401
from pyspark.sql.utils import (
to_str as _to_str,
@@ -9288,6 +9293,68 @@ def current_timezone() -> Column:
return _invoke_function("current_timezone")
+@overload
+def current_time() -> Column:
+ ...
+
+
+@overload
+def current_time(precision: int) -> Column:
+ ...
+
+
+@_try_remote_functions
+def current_time(precision: Optional[int] = None) -> Column:
+ """
+ Returns the current time at the start of query evaluation as a :class:`TimeType` column. All
+ calls of current_time within the same query return the same value.
+
+ .. versionadded:: 4.1.0
+
+ Parameters
+ ----------
+ precision: literal int, optional
+ number in the range [0..6], indicating how many fractional digits of seconds to include.
+ If omitted, the default is 6.
+
+ Returns
+ -------
+ :class:`~pyspark.sql.Column`
+ current time.
+
+ See Also
+ --------
+ :meth:`pyspark.sql.functions.current_date`
+ :meth:`pyspark.sql.functions.current_timestamp`
+
+ Examples
+ --------
+ Example 1: Current time with default precision
+
+ >>> from pyspark.sql import functions as sf
+ >>> spark.range(1).select(sf.current_time().alias("time")).show() # doctest: +SKIP
+ +---------------+
+ | time|
+ +---------------+
+ |16:57:04.304361|
+ +---------------+
+
+ Example 2: Current time with specified precision
+
+ >>> from pyspark.sql import functions as sf
+ >>> spark.range(1).select(sf.current_time(3).alias("time")).show() # doctest: +SKIP
+ +------------+
+ | time|
+ +------------+
+ |16:57:04.304|
+ +------------+
+ """
+ if precision is None:
+ return _invoke_function("current_time")
+ else:
+ return _invoke_function("current_time", _enum_to_value(precision))
+
+
@_try_remote_functions
def current_timestamp() -> Column:
"""
@@ -10127,10 +10194,13 @@ def hour(col: "ColumnOrName") -> Column:
.. versionchanged:: 3.4.0
Supports Spark Connect.
+ .. versionchanged:: 4.1.0
+ Added support for time type.
+
Parameters
----------
col : :class:`~pyspark.sql.Column` or column name
- target date/timestamp column to work on.
+ target date/time/timestamp column to work on.
Returns
-------
@@ -10177,6 +10247,21 @@ def hour(col: "ColumnOrName") -> Column:
|2015-04-08 13:08:15| timestamp| 13|
|2024-10-31 10:09:16| timestamp| 10|
+-------------------+----------+--------+
+
+ Example 3: Extract the hours from a time column
+
+ >>> import datetime
+ >>> from pyspark.sql import functions as sf
+ >>> df = spark.createDataFrame([
+ ... ("13:08:15",),
+ ... ("10:09:16",)], ['t']).withColumn("t", sf.col("t").cast("time"))
+ >>> df.select("*", sf.typeof('t'), sf.hour('t')).show()
+ +--------+---------+-------+
+ | t|typeof(t)|hour(t)|
+ +--------+---------+-------+
+ |13:08:15| time(6)| 13|
+ |10:09:16| time(6)| 10|
+ +--------+---------+-------+
"""
return _invoke_function_over_columns("hour", col)
@@ -10191,10 +10276,13 @@ def minute(col: "ColumnOrName") -> Column:
.. versionchanged:: 3.4.0
Supports Spark Connect.
+ .. versionchanged:: 4.1.0
+ Added support for time type.
+
Parameters
----------
col : :class:`~pyspark.sql.Column` or column name
- target date/timestamp column to work on.
+ target date/time/timestamp column to work on.
See Also
--------
@@ -10241,6 +10329,21 @@ def minute(col: "ColumnOrName") -> Column:
|2015-04-08 13:08:15| timestamp| 8|
|2024-10-31 10:09:16| timestamp| 9|
+-------------------+----------+----------+
+
+ Example 3: Extract the minutes from a time column
+
+ >>> import datetime
+ >>> from pyspark.sql import functions as sf
+ >>> df = spark.createDataFrame([
+ ... ("13:08:15",),
+ ... ("10:09:16",)], ['t']).withColumn("t", sf.col("t").cast("time"))
+ >>> df.select("*", sf.typeof('t'), sf.minute('t')).show()
+ +--------+---------+---------+
+ | t|typeof(t)|minute(t)|
+ +--------+---------+---------+
+ |13:08:15| time(6)| 8|
+ |10:09:16| time(6)| 9|
+ +--------+---------+---------+
"""
return _invoke_function_over_columns("minute", col)
@@ -10255,10 +10358,13 @@ def second(col: "ColumnOrName") -> Column:
.. versionchanged:: 3.4.0
Supports Spark Connect.
+ .. versionchanged:: 4.1.0
+ Added support for time type.
+
Parameters
----------
col : :class:`~pyspark.sql.Column` or column name
- target date/timestamp column to work on.
+ target date/time/timestamp column to work on.
Returns
-------
@@ -10305,6 +10411,21 @@ def second(col: "ColumnOrName") -> Column:
|2015-04-08 13:08:15| timestamp| 15|
|2024-10-31 10:09:16| timestamp| 16|
+-------------------+----------+----------+
+
+ Example 3: Extract the seconds from a time column
+
+ >>> import datetime
+ >>> from pyspark.sql import functions as sf
+ >>> df = spark.createDataFrame([
+ ... ("13:08:15",),
+ ... ("10:09:16",)], ['t']).withColumn("t", sf.col("t").cast("time"))
+ >>> df.select("*", sf.typeof('t'), sf.second('t')).show()
+ +--------+---------+---------+
+ | t|typeof(t)|second(t)|
+ +--------+---------+---------+
+ |13:08:15| time(6)| 15|
+ |10:09:16| time(6)| 16|
+ +--------+---------+---------+
"""
return _invoke_function_over_columns("second", col)
@@ -11344,6 +11465,70 @@ def to_date(col: "ColumnOrName", format: Optional[str] = None) -> Column:
return _invoke_function("to_date", _to_java_column(col), _enum_to_value(format))
+@_try_remote_functions
+def try_to_date(col: "ColumnOrName", format: Optional[str] = None) -> Column:
+ """This is a special version of `try_to_date` that performs the same operation, but returns a
+ NULL value instead of raising an error if date cannot be created.
+
+ .. _datetime pattern: https://spark.apache.org/docs/latest/sql-ref-datetime-pattern.html
+
+ .. versionadded:: 4.0.0
+
+ Parameters
+ ----------
+ col : :class:`~pyspark.sql.Column` or column name
+ input column of values to convert.
+ format: literal string, optional
+ format to use to convert date values.
+
+ Returns
+ -------
+ :class:`~pyspark.sql.Column`
+ date value as :class:`pyspark.sql.types.DateType` type.
+
+ See Also
+ --------
+ :meth:`pyspark.sql.functions.to_timestamp`
+ :meth:`pyspark.sql.functions.to_timestamp_ltz`
+ :meth:`pyspark.sql.functions.to_timestamp_ntz`
+ :meth:`pyspark.sql.functions.to_utc_timestamp`
+ :meth:`pyspark.sql.functions.try_to_timestamp`
+ :meth:`pyspark.sql.functions.date_format`
+
+ Examples
+ --------
+ >>> import pyspark.sql.functions as sf
+ >>> df = spark.createDataFrame([('1997-02-28',)], ['ts'])
+ >>> df.select('*', sf.try_to_date(df.ts)).show()
+ +----------+---------------+
+ | ts|try_to_date(ts)|
+ +----------+---------------+
+ |1997-02-28| 1997-02-28|
+ +----------+---------------+
+
+ >>> df.select('*', sf.try_to_date('ts', 'yyyy-MM-dd')).show()
+ +----------+---------------------------+
+ | ts|try_to_date(ts, yyyy-MM-dd)|
+ +----------+---------------------------+
+ |1997-02-28| 1997-02-28|
+ +----------+---------------------------+
+
+ >>> df = spark.createDataFrame([('foo',)], ['ts'])
+ >>> df.select(sf.try_to_date(df.ts)).show()
+ +---------------+
+ |try_to_date(ts)|
+ +---------------+
+ | NULL|
+ +---------------+
+ """
+ from pyspark.sql.classic.column import _to_java_column
+
+ if format is None:
+ return _invoke_function_over_columns("try_to_date", col)
+ else:
+ return _invoke_function("try_to_date", _to_java_column(col), _enum_to_value(format))
+
+
@_try_remote_functions
def unix_date(col: "ColumnOrName") -> Column:
"""Returns the number of days since 1970-01-01.
@@ -11515,6 +11700,74 @@ def unix_seconds(col: "ColumnOrName") -> Column:
return _invoke_function_over_columns("unix_seconds", col)
+@overload
+def to_time(str: "ColumnOrName") -> Column:
+ ...
+
+
+@overload
+def to_time(str: "ColumnOrName", format: "ColumnOrName") -> Column:
+ ...
+
+
+@_try_remote_functions
+def to_time(str: "ColumnOrName", format: Optional["ColumnOrName"] = None) -> Column:
+ """Converts a :class:`~pyspark.sql.Column` into :class:`pyspark.sql.types.TimeType` using the
+ optionally specified format. Specify formats according to `datetime pattern`_. By default, it
+ follows casting rules to :class:`pyspark.sql.types.TimeType` if the format is omitted.
+ Equivalent to ``col.cast("time")``.
+
+ .. _datetime pattern: https://spark.apache.org/docs/latest/sql-ref-datetime-pattern.html
+
+ .. versionadded:: 4.1.0
+
+ Parameters
+ ----------
+ str : :class:`~pyspark.sql.Column` or column name
+ string to be parsed to time.
+ format: :class:`~pyspark.sql.Column` or column name, optional
+ time format pattern to follow.
+
+ Returns
+ -------
+ :class:`~pyspark.sql.Column`
+ time value as :class:`pyspark.sql.types.TimeType` type.
+
+ See Also
+ --------
+ :meth:`pyspark.sql.functions.to_timestamp`
+ :meth:`pyspark.sql.functions.try_to_time`
+
+ Examples
+ --------
+ Example 1: Convert string to a time
+
+ >>> import pyspark.sql.functions as sf
+ >>> df = spark.createDataFrame([("10:30:00",)], ["str"])
+ >>> df.select(sf.to_time(df.str).alias("time")).show()
+ +--------+
+ | time|
+ +--------+
+ |10:30:00|
+ +--------+
+
+ Example 2: Convert string to a time with a format
+
+ >>> import pyspark.sql.functions as sf
+ >>> df = spark.createDataFrame([("10:30:00", "HH:mm:ss")], ["str", "format"])
+ >>> df.select(sf.to_time(df.str, df.format).alias("time")).show()
+ +--------+
+ | time|
+ +--------+
+ |10:30:00|
+ +--------+
+ """
+ if format is None:
+ return _invoke_function_over_columns("to_time", str)
+ else:
+ return _invoke_function_over_columns("to_time", str, format)
+
+
@overload
def to_timestamp(col: "ColumnOrName") -> Column:
...
@@ -11593,6 +11846,85 @@ def to_timestamp(col: "ColumnOrName", format: Optional[str] = None) -> Column:
return _invoke_function("to_timestamp", _to_java_column(col), _enum_to_value(format))
+@overload
+def try_to_time(str: "ColumnOrName") -> Column:
+ ...
+
+
+@overload
+def try_to_time(str: "ColumnOrName", format: "ColumnOrName") -> Column:
+ ...
+
+
+@_try_remote_functions
+def try_to_time(str: "ColumnOrName", format: Optional["ColumnOrName"] = None) -> Column:
+ """Converts a :class:`~pyspark.sql.Column` into :class:`pyspark.sql.types.TimeType` using the
+ optionally specified format. Specify formats according to `datetime pattern`_. By default, it
+ follows casting rules to :class:`pyspark.sql.types.TimeType` if the format is omitted.
+ Equivalent to ``col.cast("time")``. The function always returns null on an invalid input.
+
+ .. _datetime pattern: https://spark.apache.org/docs/latest/sql-ref-datetime-pattern.html
+
+ .. versionadded:: 4.1.0
+
+ Parameters
+ ----------
+ str : :class:`~pyspark.sql.Column` or column name
+ string to be parsed to time.
+ format: :class:`~pyspark.sql.Column` or column name, optional
+ time format pattern to follow.
+
+ Returns
+ -------
+ :class:`~pyspark.sql.Column`
+ time value as :class:`pyspark.sql.types.TimeType` type.
+
+ See Also
+ --------
+ :meth:`pyspark.sql.functions.to_time`
+ :meth:`pyspark.sql.functions.try_to_timestamp`
+
+ Examples
+ --------
+ Example 1: Convert string to a time
+
+ >>> import pyspark.sql.functions as sf
+ >>> df = spark.createDataFrame([("10:30:00",)], ["str"])
+ >>> df.select(sf.try_to_time(df.str).alias("time")).show()
+ +--------+
+ | time|
+ +--------+
+ |10:30:00|
+ +--------+
+
+ Example 2: Convert string to a time with a format
+
+ >>> import pyspark.sql.functions as sf
+ >>> df = spark.createDataFrame([("10:30:00", "HH:mm:ss")], ["str", "format"])
+ >>> df.select(sf.try_to_time(df.str, df.format).alias("time")).show()
+ +--------+
+ | time|
+ +--------+
+ |10:30:00|
+ +--------+
+
+ Example 3: Conversion failure results in NULL
+
+ >>> import pyspark.sql.functions as sf
+ >>> df = spark.createDataFrame([("malformed",)], ["str"])
+ >>> df.select(sf.try_to_time(df.str).alias("time")).show()
+ +----+
+ |time|
+ +----+
+ |NULL|
+ +----+
+ """
+ if format is None:
+ return _invoke_function_over_columns("try_to_time", str)
+ else:
+ return _invoke_function_over_columns("try_to_time", str, format)
+
+
@_try_remote_functions
def try_to_timestamp(col: "ColumnOrName", format: Optional["ColumnOrName"] = None) -> Column:
"""
@@ -12370,6 +12702,46 @@ def timestamp_seconds(col: "ColumnOrName") -> Column:
return _invoke_function_over_columns("timestamp_seconds", col)
+@_try_remote_functions
+def time_trunc(unit: "ColumnOrName", time: "ColumnOrName") -> Column:
+ """
+ Returns `time` truncated to the `unit`.
+
+ .. versionadded:: 4.1.0
+
+ Parameters
+ ----------
+ unit : :class:`~pyspark.sql.Column` or column name
+ The unit to truncate the time to. Supported units are: "HOUR", "MINUTE", "SECOND",
+ "MILLISECOND", and "MICROSECOND". The unit is case-insensitive.
+ time : :class:`~pyspark.sql.Column` or column name
+ A time to truncate.
+
+ Returns
+ -------
+ :class:`~pyspark.sql.Column`
+ A time truncated to the specified unit.
+
+ See Also
+ --------
+ :meth:`pyspark.sql.functions.date_trunc`
+
+ Examples
+ --------
+ >>> from pyspark.sql import functions as sf
+ >>> df = spark.createDataFrame(
+ ... [("HOUR", "13:08:15")],
+ ... ['unit', 'time']).withColumn("time", sf.col("time").cast("time"))
+ >>> df.select('*', sf.time_trunc('unit', 'time')).show()
+ +----+--------+----------------------+
+ |unit| time|time_trunc(unit, time)|
+ +----+--------+----------------------+
+ |HOUR|13:08:15| 13:00:00|
+ +----+--------+----------------------+
+ """
+ return _invoke_function_over_columns("time_trunc", unit, time)
+
+
@_try_remote_functions
def timestamp_millis(col: "ColumnOrName") -> Column:
"""
@@ -24305,6 +24677,41 @@ def make_interval(
)
+@_try_remote_functions
+def make_time(hour: "ColumnOrName", minute: "ColumnOrName", second: "ColumnOrName") -> Column:
+ """
+ Create time from hour, minute and second fields. For invalid inputs it will throw an error.
+
+ .. versionadded:: 4.1.0
+
+ Parameters
+ ----------
+ hour : :class:`~pyspark.sql.Column` or column name
+ The hour to represent, from 0 to 23.
+ minute : :class:`~pyspark.sql.Column` or column name
+ The minute to represent, from 0 to 59.
+ second : :class:`~pyspark.sql.Column` or column name
+ The second to represent, from 0 to 59.999999.
+
+ Returns
+ -------
+ :class:`~pyspark.sql.Column`
+ A column representing the created time.
+
+ Examples
+ --------
+ >>> from pyspark.sql import functions as sf
+ >>> df = spark.createDataFrame([(6, 30, 45.887)], ["hour", "minute", "second"])
+ >>> df.select(sf.make_time("hour", "minute", "second").alias("time")).show()
+ +------------+
+ | time|
+ +------------+
+ |06:30:45.887|
+ +------------+
+ """
+ return _invoke_function_over_columns("make_time", hour, minute, second)
+
+
@_try_remote_functions
def make_timestamp(
years: "ColumnOrName",
@@ -26640,32 +27047,7 @@ def udf(
# The following table shows most of Python data and SQL type conversions in normal UDFs that
# are not yet visible to the user. Some of behaviors are buggy and might be changed in the near
# future. The table might have to be eventually documented externally.
- # Please see SPARK-28131's PR to see the codes in order to generate the table below.
- #
- # +-----------------------------+--------------+----------+------+---------------+--------------------+-----------------------------+----------+----------------------+---------+--------------------+----------------------------+------------+--------------+------------------+----------------------+ # noqa
- # |SQL Type \ Python Value(Type)|None(NoneType)|True(bool)|1(int)| a(str)| 1970-01-01(date)|1970-01-01 00:00:00(datetime)|1.0(float)|array('i', [1])(array)|[1](list)| (1,)(tuple)|bytearray(b'ABC')(bytearray)| 1(Decimal)|{'a': 1}(dict)|Row(kwargs=1)(Row)|Row(namedtuple=1)(Row)| # noqa
- # +-----------------------------+--------------+----------+------+---------------+--------------------+-----------------------------+----------+----------------------+---------+--------------------+----------------------------+------------+--------------+------------------+----------------------+ # noqa
- # | boolean| None| True| None| None| None| None| None| None| None| None| None| None| None| X| X| # noqa
- # | tinyint| None| None| 1| None| None| None| None| None| None| None| None| None| None| X| X| # noqa
- # | smallint| None| None| 1| None| None| None| None| None| None| None| None| None| None| X| X| # noqa
- # | int| None| None| 1| None| None| None| None| None| None| None| None| None| None| X| X| # noqa
- # | bigint| None| None| 1| None| None| None| None| None| None| None| None| None| None| X| X| # noqa
- # | string| None| 'true'| '1'| 'a'|'java.util.Gregor...| 'java.util.Gregor...| '1.0'| '[I@66cbb73a'| '[1]'|'[Ljava.lang.Obje...| '[B@5a51eb1a'| '1'| '{a=1}'| X| X| # noqa
- # | date| None| X| X| X|datetime.date(197...| datetime.date(197...| X| X| X| X| X| X| X| X| X| # noqa
- # | timestamp| None| X| X| X| X| datetime.datetime...| X| X| X| X| X| X| X| X| X| # noqa
- # | float| None| None| None| None| None| None| 1.0| None| None| None| None| None| None| X| X| # noqa
- # | double| None| None| None| None| None| None| 1.0| None| None| None| None| None| None| X| X| # noqa
- # | array| None| None| None| None| None| None| None| [1]| [1]| [1]| [65, 66, 67]| None| None| X| X| # noqa
- # | binary| None| None| None|bytearray(b'a')| None| None| None| None| None| None| bytearray(b'ABC')| None| None| X| X| # noqa
- # | decimal(10,0)| None| None| None| None| None| None| None| None| None| None| None|Decimal('1')| None| X| X| # noqa
- # | map| None| None| None| None| None| None| None| None| None| None| None| None| {'a': 1}| X| X| # noqa
- # | struct<_1:int>| None| X| X| X| X| X| X| X|Row(_1=1)| Row(_1=1)| X| X| Row(_1=None)| Row(_1=1)| Row(_1=1)| # noqa
- # +-----------------------------+--------------+----------+------+---------------+--------------------+-----------------------------+----------+----------------------+---------+--------------------+----------------------------+------------+--------------+------------------+----------------------+ # noqa
- #
- # Note: DDL formatted string is used for 'SQL Type' for simplicity. This string can be
- # used in `returnType`.
- # Note: The values inside of the table are generated by `repr`.
- # Note: 'X' means it throws an exception during the conversion.
+ # Please see python/pyspark/sql/tests/udf_type_tests for type tests and golden files
# decorator @udf, @udf(), @udf(dataType())
if f is None or isinstance(f, (str, DataType)):
@@ -26850,6 +27232,75 @@ def udtf(
return _create_py_udtf(cls=cls, returnType=returnType, useArrow=useArrow)
+@_try_remote_functions
+def arrow_udtf(
+ cls: Optional[Type] = None,
+ *,
+ returnType: Optional[Union[StructType, str]] = None,
+) -> Union["UserDefinedTableFunction", Callable[[Type], "UserDefinedTableFunction"]]:
+ """Creates a PyArrow-native user defined table function (UDTF).
+
+ This function provides a PyArrow-native interface for UDTFs, where the eval method
+ receives PyArrow RecordBatches or Arrays and returns an Iterator of PyArrow Tables
+ or RecordBatches.
+ This enables true vectorized computation without row-by-row processing overhead.
+
+ .. versionadded:: 4.1.0
+
+ Parameters
+ ----------
+ cls : class, optional
+ the Python user-defined table function handler class.
+ returnType : :class:`pyspark.sql.types.StructType` or str, optional
+ the return type of the user-defined table function. The value can be either a
+ :class:`pyspark.sql.types.StructType` object or a DDL-formatted struct type string.
+
+ Examples
+ --------
+ UDTF with PyArrow RecordBatch input:
+
+ >>> import pyarrow as pa
+ >>> from pyspark.sql.functions import arrow_udtf
+ >>> @arrow_udtf(returnType="x int, y int")
+ ... class MyUDTF:
+ ... def eval(self, batch: pa.RecordBatch):
+ ... # Process the entire batch vectorized
+ ... x_array = batch.column('x')
+ ... y_array = batch.column('y')
+ ... result_table = pa.table({
+ ... 'x': x_array,
+ ... 'y': y_array
+ ... })
+ ... yield result_table
+ ...
+ >>> df = spark.range(10).selectExpr("id as x", "id as y")
+ >>> MyUDTF(df.asTable()).show() # doctest: +SKIP
+
+ UDTF with PyArrow Array inputs:
+
+ >>> @arrow_udtf(returnType="x int, y int")
+ ... class MyUDTF2:
+ ... def eval(self, x: pa.Array, y: pa.Array):
+ ... # Process arrays vectorized
+ ... result_table = pa.table({
+ ... 'x': x,
+ ... 'y': y
+ ... })
+ ... yield result_table
+ ...
+ >>> MyUDTF2(lit(1), lit(2)).show() # doctest: +SKIP
+
+ Notes
+ -----
+ - The eval method must accept PyArrow RecordBatches or Arrays as input
+ - The eval method must yield PyArrow Tables or RecordBatches as output
+ """
+ if cls is None:
+ return functools.partial(_create_pyarrow_udtf, returnType=returnType)
+ else:
+ return _create_pyarrow_udtf(cls=cls, returnType=returnType)
+
+
def _test() -> None:
import doctest
from pyspark.sql import SparkSession
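A hedged sketch of defining and invoking the PyArrow-native UDTF added above; the class and column names are illustrative, and it mirrors the `RecordBatch` form shown in the `arrow_udtf` docstring (requires a 4.1.0 build and a running SparkSession):

import pyarrow as pa
from pyspark.sql import SparkSession
from pyspark.sql.functions import arrow_udtf

spark = SparkSession.builder.getOrCreate()

@arrow_udtf(returnType="x bigint, doubled bigint")
class DoubleX:
    def eval(self, batch: pa.RecordBatch):
        x = batch.column("x")
        # Whole-batch (vectorized) computation; yield one pyarrow Table per input batch.
        yield pa.table({"x": x, "doubled": pa.compute.multiply(x, 2)})

df = spark.range(5).selectExpr("id as x")
DoubleX(df.asTable()).show()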
diff --git a/python/pyspark/sql/pandas/_typing/__init__.pyi b/python/pyspark/sql/pandas/_typing/__init__.pyi
index 8b617ee02eea1..d1e2b7aae6f86 100644
--- a/python/pyspark/sql/pandas/_typing/__init__.pyi
+++ b/python/pyspark/sql/pandas/_typing/__init__.pyi
@@ -63,6 +63,8 @@ GroupedMapUDFTransformWithStateInitStateType = Literal[214]
# Arrow UDFs
ArrowScalarUDFType = Literal[250]
ArrowScalarIterUDFType = Literal[251]
+ArrowGroupedAggUDFType = Literal[252]
+ArrowWindowAggUDFType = Literal[253]
class ArrowVariadicScalarToScalarFunction(Protocol):
def __call__(self, *_: pyarrow.Array) -> pyarrow.Array: ...
diff --git a/python/pyspark/sql/pandas/conversion.py b/python/pyspark/sql/pandas/conversion.py
index 18360fd813921..cb7dfa5552600 100644
--- a/python/pyspark/sql/pandas/conversion.py
+++ b/python/pyspark/sql/pandas/conversion.py
@@ -28,7 +28,6 @@
from warnings import warn
from pyspark.errors.exceptions.captured import unwrap_spark_exception
-from pyspark.loose_version import LooseVersion
from pyspark.util import _load_from_socket
from pyspark.sql.pandas.serializers import ArrowCollectSerializer
from pyspark.sql.pandas.types import _dedup_names
@@ -121,18 +120,10 @@ def toPandas(self) -> "PandasDataFrameLike":
# Pandas DataFrame created from PyArrow uses datetime64[ns] for date type
# values, but we should use datetime.date to match the behavior with when
# Arrow optimization is disabled.
- pandas_options = {"date_as_object": True}
-
- if LooseVersion(pa.__version__) >= LooseVersion("13.0.0"):
- # A legacy option to coerce date32, date64, duration, and timestamp
- # time units to nanoseconds when converting to pandas.
- # This option can only be added since 13.0.0.
- pandas_options.update(
- {
- "coerce_temporal_nanoseconds": True,
- }
- )
-
+ pandas_options = {
+ "date_as_object": True,
+ "coerce_temporal_nanoseconds": True,
+ }
if self_destruct:
# Configure PyArrow to use as little memory as possible:
# self_destruct - free columns as they are converted
@@ -739,7 +730,7 @@ def _create_from_pandas_with_arrow(
jsparkSession = self._jsparkSession
safecheck = self._jconf.arrowSafeTypeConversion()
- ser = ArrowStreamPandasSerializer(timezone, safecheck)
+ ser = ArrowStreamPandasSerializer(timezone, safecheck, False)
@no_type_check
def reader_func(temp_filename):
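For context on the hunk above: both options are now passed unconditionally because Spark's minimum PyArrow already provides `coerce_temporal_nanoseconds` (added in PyArrow 13.0.0), so the version guard is no longer needed. A small sketch of what those `to_pandas` options do, assuming PyArrow >= 13:

import datetime
import pyarrow as pa

table = pa.table({"d": pa.array([datetime.date(1970, 1, 2)], type=pa.date32())})
pdf = table.to_pandas(date_as_object=True, coerce_temporal_nanoseconds=True)
print(type(pdf["d"][0]))  # <class 'datetime.date'>, not a pandas Timestamp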
diff --git a/python/pyspark/sql/pandas/functions.py b/python/pyspark/sql/pandas/functions.py
index 6fc15c03a6bdc..79f3f75bd573c 100644
--- a/python/pyspark/sql/pandas/functions.py
+++ b/python/pyspark/sql/pandas/functions.py
@@ -48,26 +48,292 @@ class ArrowUDFType:
SCALAR_ITER = PythonEvalType.SQL_SCALAR_ARROW_ITER_UDF
+ GROUPED_AGG = PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF
+
def arrow_udf(f=None, returnType=None, functionType=None):
- return vectorized_udf(f, returnType, functionType, "arrow")
+ """
+ Creates an arrow user defined function.
+ Arrow UDFs are user defined functions that are executed by Spark using Arrow to transfer
+ and work with the data, which allows `pyarrow.Array` operations. An Arrow UDF is defined
+ using the `arrow_udf` as a decorator or to wrap the function, and no additional configuration
+ is required. An Arrow UDF behaves as a regular PySpark function API in general.
-def pandas_udf(f=None, returnType=None, functionType=None):
- return vectorized_udf(f, returnType, functionType, "pandas")
+ .. versionadded:: 4.1.0
+ Parameters
+ ----------
+ f : function, optional
+ user-defined function. A python function if used as a standalone function
+ returnType : :class:`pyspark.sql.types.DataType` or str, optional
+ the return type of the user-defined function. The value can be either a
+ :class:`pyspark.sql.types.DataType` object or a DDL-formatted type string.
+ functionType : int, optional
+ an enum value in :class:`pyspark.sql.functions.ArrowUDFType`.
+ Default: SCALAR. This parameter exists for compatibility.
+ Using Python type hints is encouraged.
-def vectorized_udf(
- f=None,
- returnType=None,
- functionType=None,
- kind: str = "pandas",
-):
+ Examples
+ --------
+ In order to use this API, customarily the below are imported:
+
+ >>> import pyarrow as pa
+ >>> from pyspark.sql.functions import arrow_udf
+
+ `Python type hints <https://www.python.org/dev/peps/pep-0484>`_
+ detect the function types as below:
+
+ >>> from pyspark.sql.functions import ArrowUDFType
+ >>> from pyspark.sql.types import IntegerType
+ >>> @arrow_udf(IntegerType(), ArrowUDFType.SCALAR)
+ ... def slen(v: pa.Array) -> pa.Array:
+ ... return pa.compute.utf8_length(v)
+
+ Note that the type hint should use `pyarrow.Array` in all cases.
+
+ * Arrays to Arrays
+ `pyarrow.Array`, ... -> `pyarrow.Array`
+
+ The function takes one or more `pyarrow.Array` and outputs one `pyarrow.Array`.
+ The output of the function should always be of the same length as the input.
+
+ >>> @arrow_udf("string")
+ ... def to_upper(s: pa.Array) -> pa.Array:
+ ... return pa.compute.ascii_upper(s)
+ ...
+ >>> df = spark.createDataFrame([("John Doe",)], ("name",))
+ >>> df.select(to_upper("name")).show()
+ +--------------+
+ |to_upper(name)|
+ +--------------+
+ | JOHN DOE|
+ +--------------+
+
+ >>> @arrow_udf("first string, last string")
+ ... def split_expand(v: pa.Array) -> pa.Array:
+ ... b = pa.compute.ascii_split_whitespace(v)
+ ... s0 = pa.array([t[0] for t in b])
+ ... s1 = pa.array([t[1] for t in b])
+ ... return pa.StructArray.from_arrays([s0, s1], names=["first", "last"])
+ ...
+ >>> df = spark.createDataFrame([("John Doe",)], ("name",))
+ >>> df.select(split_expand("name")).show()
+ +------------------+
+ |split_expand(name)|
+ +------------------+
+ | {John, Doe}|
+ +------------------+
+
+ This type of Arrow UDF can use keyword arguments:
+
+ >>> from pyspark.sql import functions as sf
+ >>> @arrow_udf(returnType=IntegerType())
+ ... def calc(a: pa.Array, b: pa.Array) -> pa.Array:
+ ... return pa.compute.add(a, pa.compute.multiply(b, 10))
+ ...
+ >>> spark.range(2).select(calc(b=sf.col("id") * 10, a=sf.col("id"))).show()
+ +-----------------------------+
+ |calc(b => (id * 10), a => id)|
+ +-----------------------------+
+ | 0|
+ | 101|
+ +-----------------------------+
+
+ .. note:: The length of the input is not that of the whole input column, but is the
+ length of an internal batch used for each call to the function.
+
+ * Iterator of Arrays to Iterator of Arrays
+ `Iterator[pyarrow.Array]` -> `Iterator[pyarrow.Array]`
+
+ The function takes an iterator of `pyarrow.Array` and outputs an iterator of
+ `pyarrow.Array`. In this case, the created arrow UDF instance requires one input
+ column when this is called as a PySpark column. The length of the entire output from
+ the function should be the same length of the entire input; therefore, it can
+ prefetch the data from the input iterator as long as the lengths are the same.
+
+ It is also useful when the UDF execution
+ requires initializing some states, although internally it works identically as
+ Arrays to Arrays case. The pseudocode below illustrates the example.
+
+ .. highlight:: python
+ .. code-block:: python
+
+ @arrow_udf("long")
+ def calculate(iterator: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ # Do some expensive initialization with a state
+ state = very_expensive_initialization()
+ for x in iterator:
+ # Use that state for whole iterator.
+ yield calculate_with_state(x, state)
+
+ df.select(calculate("value")).show()
+
+ >>> import pandas as pd
+ >>> from typing import Iterator
+ >>> @arrow_udf("long")
+ ... def plus_one(iterator: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ ... for v in iterator:
+ ... yield pa.compute.add(v, 1)
+ ...
+ >>> df = spark.createDataFrame(pd.DataFrame([1, 2, 3], columns=["v"]))
+ >>> df.select(plus_one(df.v)).show()
+ +-----------+
+ |plus_one(v)|
+ +-----------+
+ | 2|
+ | 3|
+ | 4|
+ +-----------+
+
+ .. note:: The length of each array is the length of a batch internally used.
+
+ * Iterator of Multiple Arrays to Iterator of Arrays
+ `Iterator[Tuple[pyarrow.Array, ...]]` -> `Iterator[pyarrow.Array]`
+
+ The function takes an iterator of a tuple of multiple `pyarrow.Array` and outputs an
+ iterator of `pyarrow.Array`. In this case, the created arrow UDF instance requires
+ input columns as many as the series when this is called as a PySpark column.
+ Otherwise, it has the same characteristics and restrictions as Iterator of Arrays
+ to Iterator of Arrays case.
+
+ >>> from typing import Iterator, Tuple
+ >>> from pyspark.sql import functions as sf
+ >>> @arrow_udf("long")
+ ... def multiply(iterator: Iterator[Tuple[pa.Array, pa.Array]]) -> Iterator[pa.Array]:
+ ... for v1, v2 in iterator:
+ ... yield pa.compute.multiply(v1, v2.field("v"))
+ ...
+ >>> df = spark.createDataFrame(pd.DataFrame([1, 2, 3], columns=["v"]))
+ >>> df.withColumn('output', multiply(sf.col("v"), sf.struct(sf.col("v")))).show()
+ +---+------+
+ | v|output|
+ +---+------+
+ | 1| 1|
+ | 2| 4|
+ | 3| 9|
+ +---+------+
+
+ .. note:: The length of each array is the length of a batch internally used.
+
+ * Arrays to Scalar
+ `pyarrow.Array`, ... -> `Any`
+
+ The function takes `pyarrow.Array` and returns a scalar value. The returned scalar
+ can be a python primitive type, (e.g., int or float), a numpy data type (e.g.,
+ numpy.int64 or numpy.float64), or a `pyarrow.Scalar` instance which supports complex
+ return types.
+ `Any` should ideally be a specific scalar type accordingly.
+
+ >>> @arrow_udf("double")
+ ... def mean_udf(v: pa.Array) -> float:
+ ... return pa.compute.mean(v).as_py()
+ ...
+ >>> df = spark.createDataFrame(
+ ... [(1, 1.0), (1, 2.0), (2, 3.0), (2, 5.0), (2, 10.0)], ("id", "v"))
+ >>> df.groupby("id").agg(mean_udf(df['v'])).show()
+ +---+-----------+
+ | id|mean_udf(v)|
+ +---+-----------+
+ | 1| 1.5|
+ | 2| 6.0|
+ +---+-----------+
+
+ The return type can also be a complex type such as struct, list, or map.
+
+ >>> @arrow_udf("struct")
+ ... def min_max_udf(v: pa.Array) -> pa.Scalar:
+ ... m1 = pa.compute.min(v)
+ ... m2 = pa.compute.max(v)
+ ... t = pa.struct([pa.field("m1", pa.float64()), pa.field("m2", pa.float64())])
+ ... return pa.scalar(value={"m1": m1.as_py(), "m2": m2.as_py()}, type=t)
+ ...
+ >>> df = spark.createDataFrame(
+ ... [(1, 1.0), (1, 2.0), (2, 3.0), (2, 5.0), (2, 10.0)], ("id", "v"))
+ >>> df.groupby("id").agg(min_max_udf(df['v'])).show()
+ +---+--------------+
+ | id|min_max_udf(v)|
+ +---+--------------+
+ | 1| {1.0, 2.0}|
+ | 2| {3.0, 10.0}|
+ +---+--------------+
+
+ This type of Arrow UDF can use keyword arguments:
+
+ >>> @arrow_udf("double")
+ ... def weighted_mean_udf(v: pa.Array, w: pa.Array) -> float:
+ ... import numpy as np
+ ... return np.average(v.to_numpy(), weights=w)
+ ...
+ >>> df = spark.createDataFrame(
+ ... [(1, 1.0, 1.0), (1, 2.0, 2.0), (2, 3.0, 1.0), (2, 5.0, 2.0), (2, 10.0, 3.0)],
+ ... ("id", "v", "w"))
+ >>> df.groupby("id").agg(weighted_mean_udf(w=df["w"], v=df["v"])).show()
+ +---+---------------------------------+
+ | id|weighted_mean_udf(w => w, v => v)|
+ +---+---------------------------------+
+ | 1| 1.6666666666666667|
+ | 2| 7.166666666666667|
+ +---+---------------------------------+
+
+ This UDF can also be used as window functions as below:
+
+ >>> from pyspark.sql import Window
+ >>> @arrow_udf("double")
+ ... def mean_udf(v: pa.Array) -> float:
+ ... return pa.compute.mean(v).as_py()
+ ...
+ >>> df = spark.createDataFrame(
+ ... [(1, 1.0), (1, 2.0), (2, 3.0), (2, 5.0), (2, 10.0)], ("id", "v"))
+ >>> w = Window.partitionBy('id').orderBy('v').rowsBetween(-1, 0)
+ >>> df.withColumn('mean_v', mean_udf("v").over(w)).show()
+ +---+----+------+
+ | id| v|mean_v|
+ +---+----+------+
+ | 1| 1.0| 1.0|
+ | 1| 2.0| 1.5|
+ | 2| 3.0| 3.0|
+ | 2| 5.0| 4.0|
+ | 2|10.0| 7.5|
+ +---+----+------+
+
+ .. note:: For performance reasons, the input arrays to window functions are not copied.
+ Therefore, mutating the input arrays is not allowed and will cause incorrect results.
+ For the same reason, users should also not rely on the index of the input arrays.
+
+ Notes
+ -----
+ The user-defined functions do not support conditional expressions or short circuiting
+ in boolean expressions and it ends up with being executed all internally. If the functions
+ can fail on special rows, the workaround is to incorporate the condition into the functions.
+
+ The user-defined functions do not take keyword arguments on the calling side.
+
+ The data type of returned `pyarrow.Array` from the user-defined functions should be
+ matched with defined `returnType` (see :meth:`types.to_arrow_type` and
+ :meth:`types.from_arrow_type`). When there is mismatch between them, Spark might do
+ conversion on returned data. The conversion is not guaranteed to be correct and results
+ should be checked for accuracy by users.
+
+ See Also
+ --------
+ pyspark.sql.GroupedData.agg
+ pyspark.sql.DataFrame.mapInArrow
+ pyspark.sql.GroupedData.applyInArrow
+ pyspark.sql.PandasCogroupedOps.applyInArrow
+ pyspark.sql.UDFRegistration.register
"""
- Creates a vectorized user defined function.
+ require_minimum_pyarrow_version()
+
+ return vectorized_udf(f, returnType, functionType, "arrow")
+
+
+def pandas_udf(f=None, returnType=None, functionType=None):
+ """
+ Creates a pandas user defined function.
Pandas UDFs are user defined functions that are executed by Spark using Arrow to transfer
- data and Pandas to work with the data, which allows vectorized operations. A Pandas UDF
+ data and Pandas to work with the data, which allows pandas operations. A Pandas UDF
is defined using the `pandas_udf` as a decorator or to wrap the function, and no
additional configuration is required. A Pandas UDF behaves as a regular PySpark function
API in general.
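The new `ArrowUDFType.GROUPED_AGG` above backs the "Arrays to Scalar" form documented in the `arrow_udf` docstring. A hedged sketch of using it as a grouped aggregation, mirroring the docstring's mean example (assumes a 4.1.0 build with `arrow_udf` available):

import pyarrow as pa
from pyspark.sql import SparkSession
from pyspark.sql.functions import arrow_udf

spark = SparkSession.builder.getOrCreate()

@arrow_udf("double")
def arrow_mean(v: pa.Array) -> float:
    # An Arrays-to-Scalar UDF; Spark runs it as a grouped aggregate (GROUPED_AGG).
    return pa.compute.mean(v).as_py()

df = spark.createDataFrame([(1, 1.0), (1, 2.0), (2, 3.0), (2, 5.0)], ("id", "v"))
df.groupby("id").agg(arrow_mean("v")).show()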
@@ -102,6 +368,7 @@ def vectorized_udf(
From Spark 3.0 with Python 3.6+, `Python type hints <https://www.python.org/dev/peps/pep-0484>`_
detect the function types as below:
+ >>> from pyspark.sql.types import IntegerType
>>> @pandas_udf(IntegerType())
... def slen(s: pd.Series) -> pd.Series:
... return s.str.len()
@@ -125,21 +392,26 @@ def vectorized_udf(
`pandas.DataFrame` as below:
>>> @pandas_udf("col1 string, col2 long")
- >>> def func(s1: pd.Series, s2: pd.Series, s3: pd.DataFrame) -> pd.DataFrame:
+ ... def func(s1: pd.Series, s2: pd.Series, s3: pd.DataFrame) -> pd.DataFrame:
... s3['col2'] = s1 + s2.str.len()
... return s3
- ...
- >>> # Create a Spark DataFrame that has three columns including a struct column.
- ... df = spark.createDataFrame(
+
+
+ Create a Spark DataFrame that has three columns including a struct column.
+
+ >>> df = spark.createDataFrame(
... [[1, "a string", ("a nested string",)]],
... "long_col long, string_col string, struct_col struct")
+
>>> df.printSchema()
root
- |-- long_column: long (nullable = true)
- |-- string_column: string (nullable = true)
- |-- struct_column: struct (nullable = true)
+ |-- long_col: long (nullable = true)
+ |-- string_col: string (nullable = true)
+ |-- struct_col: struct (nullable = true)
| |-- col1: string (nullable = true)
+
>>> df.select(func("long_col", "string_col", "struct_col")).printSchema()
+ root
|-- func(long_col, string_col, struct_col): struct (nullable = true)
| |-- col1: string (nullable = true)
| |-- col2: long (nullable = true)
@@ -179,11 +451,12 @@ def vectorized_udf(
This type of Pandas UDF can use keyword arguments:
+ >>> from pyspark.sql import functions as sf
>>> @pandas_udf(returnType=IntegerType())
... def calc(a: pd.Series, b: pd.Series) -> pd.Series:
... return a + 10 * b
...
- >>> spark.range(2).select(calc(b=col("id") * 10, a=col("id"))).show()
+ >>> spark.range(2).select(calc(b=sf.col("id") * 10, a=sf.col("id"))).show()
+-----------------------------+
|calc(b => (id * 10), a => id)|
+-----------------------------+
@@ -248,14 +521,14 @@ def calculate(iterator: Iterator[pd.Series]) -> Iterator[pd.Series]:
to Iterator of Series case.
>>> from typing import Iterator, Tuple
- >>> from pyspark.sql.functions import struct, col
+ >>> from pyspark.sql import functions as sf
>>> @pandas_udf("long")
... def multiply(iterator: Iterator[Tuple[pd.Series, pd.DataFrame]]) -> Iterator[pd.Series]:
... for s1, df in iterator:
... yield s1 * df.v
...
>>> df = spark.createDataFrame(pd.DataFrame([1, 2, 3], columns=["v"]))
- >>> df.withColumn('output', multiply(col("v"), struct(col("v")))).show()
+ >>> df.withColumn('output', multiply(sf.col("v"), sf.struct(sf.col("v")))).show()
+---+------+
| v|output|
+---+------+
@@ -359,40 +632,26 @@ def calculate(iterator: Iterator[pd.Series]) -> Iterator[pd.Series]:
pyspark.sql.UDFRegistration.register
"""
- # The following table shows most of Pandas data and SQL type conversions in Pandas UDFs that
- # are not yet visible to the user. Some of behaviors are buggy and might be changed in the near
- # future. The table might have to be eventually documented externally.
- # Please see SPARK-28132's PR to see the codes in order to generate the table below.
- #
- # +-----------------------------+----------------------+------------------+------------------+------------------+--------------------+--------------------+------------------+------------------+------------------+------------------+--------------+--------------+--------------+-----------------------------------+-----------------------------------------------------+-----------------+--------------------+-----------------------------+--------------+-----------------+------------------+---------------+--------------------------------+ # noqa
- # |SQL Type \ Pandas Value(Type)|None(object(NoneType))| True(bool)| 1(int8)| 1(int16)| 1(int32)| 1(int64)| 1(uint8)| 1(uint16)| 1(uint32)| 1(uint64)| 1.0(float16)| 1.0(float32)| 1.0(float64)|1970-01-01 00:00:00(datetime64[ns])|1970-01-01 00:00:00-05:00(datetime64[ns, US/Eastern])|a(object(string))| 1(object(Decimal))|[1 2 3](object(array[int32]))| 1.0(float128)|(1+0j)(complex64)|(1+0j)(complex128)| A(category)|1 days 00:00:00(timedelta64[ns])| # noqa
- # +-----------------------------+----------------------+------------------+------------------+------------------+--------------------+--------------------+------------------+------------------+------------------+------------------+--------------+--------------+--------------+-----------------------------------+-----------------------------------------------------+-----------------+--------------------+-----------------------------+--------------+-----------------+------------------+---------------+--------------------------------+ # noqa
- # | boolean| None| True| True| True| True| True| True| True| True| True| True| True| True| X| X| X| X| X| X| X| X| X| X| # noqa
- # | tinyint| None| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| X| X| X| 1| X| X| X| X| X| X| # noqa
- # | smallint| None| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| X| X| X| 1| X| X| X| X| X| X| # noqa
- # | int| None| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| X| X| X| 1| X| X| X| X| X| X| # noqa
- # | bigint| None| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 1| 0| 18000000000000| X| 1| X| X| X| X| X| 86400000000000| # noqa
- # | float| None| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| X| X| X| X| X| X| X| X| X| X| # noqa
- # | double| None| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| 1.0| X| X| X| X| X| X| X| X| X| X| # noqa
- # | date| None| X| X| X|datetime.date(197...| X| X| X| X| X| X| X| X| datetime.date(197...| datetime.date(197...| X|datetime.date(197...| X| X| X| X| X| X| # noqa
- # | timestamp| None| X| X| X| X|datetime.datetime...| X| X| X| X| X| X| X| datetime.datetime...| datetime.datetime...| X|datetime.datetime...| X| X| X| X| X| X| # noqa
- # | string| None| X| X| X| X| X| X| X| X| X| X| X| X| X| X| 'a'| X| X| X| X| X| 'A'| X| # noqa
- # | decimal(10,0)| None| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| Decimal('1')| X| X| X| X| X| X| # noqa
- # | array| None| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| [1, 2, 3]| X| X| X| X| X| # noqa
- # | map| None| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| # noqa
- # | struct<_1:int>| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| X| # noqa
- # | binary| None|bytearray(b'\x01')|bytearray(b'\x01')|bytearray(b'\x01')| bytearray(b'\x01')| bytearray(b'\x01')|bytearray(b'\x01')|bytearray(b'\x01')|bytearray(b'\x01')|bytearray(b'\x01')|bytearray(b'')|bytearray(b'')|bytearray(b'')| bytearray(b'')| bytearray(b'')| bytearray(b'a')| X| X|bytearray(b'')| bytearray(b'')| bytearray(b'')|bytearray(b'A')| bytearray(b'')| # noqa
- # +-----------------------------+----------------------+------------------+------------------+------------------+--------------------+--------------------+------------------+------------------+------------------+------------------+--------------+--------------+--------------+-----------------------------------+-----------------------------------------------------+-----------------+--------------------+-----------------------------+--------------+-----------------+------------------+---------------+--------------------------------+ # noqa
- #
- # Note: DDL formatted string is used for 'SQL Type' for simplicity. This string can be
- # used in `returnType`.
- # Note: The values inside of the table are generated by `repr`.
- # Note: Python 3.11.9, Pandas 2.2.3 and PyArrow 17.0.0 are used.
- # Note: Timezone is KST.
- # Note: 'X' means it throws an exception during the conversion.
+ # The return type and input type behavior of pandas_udfs is documented in
+ # python/pyspark/sql/tests/udf_type_tests. That folder contains the type tests and
+ # the golden files showing most of the Pandas data and SQL type conversions in
+ # Pandas UDFs that are not yet visible to the user, as well as the code to
+ # regenerate the tables.
+ # Some of the behaviors are buggy and might change in the near future. The table
+ # might eventually have to be documented externally.
require_minimum_pandas_version()
require_minimum_pyarrow_version()
+ return vectorized_udf(f, returnType, functionType, "pandas")
+
+
+def vectorized_udf(
+ f=None,
+ returnType=None,
+ functionType=None,
+ kind: str = "pandas",
+):
assert kind in ["pandas", "arrow"], "kind should be either 'pandas' or 'arrow'"
# decorator @pandas_udf(returnType, functionType)
@@ -454,6 +713,7 @@ def calculate(iterator: Iterator[pd.Series]) -> Iterator[pd.Series]:
if kind == "arrow" and eval_type not in [
PythonEvalType.SQL_SCALAR_ARROW_UDF,
PythonEvalType.SQL_SCALAR_ARROW_ITER_UDF,
+ PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF,
None,
]: # None means it should infer the type from type hints.
raise PySparkTypeError(
@@ -524,7 +784,7 @@ def _validate_vectorized_udf(f, evalType, kind: str = "pandas") -> int:
type_hints = get_type_hints(f)
except NameError:
type_hints = {}
- evalType = infer_eval_type(signature(f), type_hints)
+ evalType = infer_eval_type(signature(f), type_hints, kind)
assert evalType is not None
if evalType is None:
@@ -541,6 +801,7 @@ def _validate_vectorized_udf(f, evalType, kind: str = "pandas") -> int:
evalType == PythonEvalType.SQL_SCALAR_PANDAS_UDF
or evalType == PythonEvalType.SQL_SCALAR_ARROW_UDF
or evalType == PythonEvalType.SQL_SCALAR_PANDAS_ITER_UDF
+ or evalType == PythonEvalType.SQL_SCALAR_ARROW_ITER_UDF
)
and len(argspec.args) == 0
and argspec.varargs is None
@@ -549,7 +810,7 @@ def _validate_vectorized_udf(f, evalType, kind: str = "pandas") -> int:
errorClass="INVALID_PANDAS_UDF",
messageParameters={
"detail": f"0-arg {kind_str} are not supported. "
- "Instead, create a 1-arg pandas_udf and ignore the arg in your function.",
+ f"Instead, create a 1-arg {kind_str} and ignore the arg in your function.",
},
)
@@ -602,3 +863,31 @@ def _create_vectorized_udf(f, returnType, evalType, kind):
return _create_connect_udf(f, returnType, evalType)
else:
return _create_udf(f, returnType, evalType)
+
+
+def _test() -> None:
+ import sys
+ import doctest
+ from pyspark.sql import SparkSession
+ import pyspark.sql.pandas.functions
+
+ globs = pyspark.sql.pandas.functions.__dict__.copy()
+ spark = (
+ SparkSession.builder.master("local[4]")
+ .appName("pyspark.sql.pandas.functions tests")
+ .getOrCreate()
+ )
+ globs["spark"] = spark
+
+ (failure_count, test_count) = doctest.testmod(
+ pyspark.sql.pandas.functions,
+ globs=globs,
+ optionflags=doctest.ELLIPSIS | doctest.NORMALIZE_WHITESPACE | doctest.REPORT_NDIFF,
+ )
+ spark.stop()
+ if failure_count:
+ sys.exit(-1)
+
+
+if __name__ == "__main__":
+ _test()
diff --git a/python/pyspark/sql/pandas/functions.pyi b/python/pyspark/sql/pandas/functions.pyi
index 925871bd0e61e..70ff08679b6b0 100644
--- a/python/pyspark/sql/pandas/functions.pyi
+++ b/python/pyspark/sql/pandas/functions.pyi
@@ -39,6 +39,7 @@ from pyspark.sql.pandas._typing import (
ArrowScalarUDFType,
ArrowScalarIterFunction,
ArrowScalarIterUDFType,
+ ArrowGroupedAggUDFType,
)
from pyspark import since as since # noqa: F401
@@ -54,6 +55,7 @@ class PandasUDFType:
class ArrowUDFType:
SCALAR: ArrowScalarUDFType
SCALAR_ITER: ArrowScalarIterUDFType
+ GROUPED_AGG: ArrowGroupedAggUDFType
@overload
def arrow_udf(
diff --git a/python/pyspark/sql/pandas/serializers.py b/python/pyspark/sql/pandas/serializers.py
index b154318dc430c..437ceede78a69 100644
--- a/python/pyspark/sql/pandas/serializers.py
+++ b/python/pyspark/sql/pandas/serializers.py
@@ -19,12 +19,12 @@
Serializers for PyArrow and pandas conversions. See `pyspark.serializers` for more details.
"""
+from decimal import Decimal
from itertools import groupby
from typing import TYPE_CHECKING, Optional
import pyspark
from pyspark.errors import PySparkRuntimeError, PySparkTypeError, PySparkValueError
-from pyspark.loose_version import LooseVersion
from pyspark.serializers import (
Serializer,
read_int,
@@ -33,6 +33,7 @@
CPickleSerializer,
)
from pyspark.sql import Row
+from pyspark.sql.conversion import LocalDataToArrowConversion, ArrowTableToRowsConversion
from pyspark.sql.pandas.types import (
from_arrow_type,
is_variant,
@@ -195,6 +196,38 @@ def load_stream(self, stream):
return ArrowStreamSerializer.load_stream(self, stream)
+class ArrowStreamArrowUDTFSerializer(ArrowStreamUDTFSerializer):
+ """
+ Serializer for PyArrow-native UDTFs that work directly with PyArrow RecordBatches and Arrays.
+ """
+
+ def __init__(self, table_arg_offsets=None):
+ super().__init__()
+ self.table_arg_offsets = table_arg_offsets if table_arg_offsets else []
+
+ def load_stream(self, stream):
+ """
+ Flatten the struct into Arrow's record batches.
+ """
+ import pyarrow as pa
+
+ batches = super().load_stream(stream)
+ for batch in batches:
+ result_batches = []
+ for i in range(batch.num_columns):
+ if i in self.table_arg_offsets:
+ struct = batch.column(i)
+ # Flatten the struct and create a RecordBatch from it
+ flattened_batch = pa.RecordBatch.from_arrays(
+ struct.flatten(), schema=pa.schema(struct.type)
+ )
+ result_batches.append(flattened_batch)
+ else:
+ # Keep the column as it is for non-table columns
+ result_batches.append(batch.column(i))
+ yield result_batches
+
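# Editorial sketch (not part of this patch): the flattening step above, shown standalone
# on a hypothetical struct column with fields "a" and "b". A struct-typed Arrow column is
# expanded into a RecordBatch whose columns are the struct's child arrays, which is what
# result_batches collects for table arguments.
import pyarrow as pa

struct = pa.array([{"a": 1, "b": "x"}, {"a": 2, "b": "y"}])
flattened = pa.RecordBatch.from_arrays(struct.flatten(), schema=pa.schema(struct.type))
assert flattened.num_columns == 2 and flattened.num_rows == 2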
+
class ArrowStreamGroupUDFSerializer(ArrowStreamUDFSerializer):
"""
Serializes pyarrow.RecordBatch data with Arrow streaming format.
@@ -250,12 +283,50 @@ class ArrowStreamPandasSerializer(ArrowStreamSerializer):
If True, conversion from Arrow to Pandas checks for overflow/truncation
assign_cols_by_name : bool
If True, then Pandas DataFrames will get columns by name
+ int_to_decimal_coercion_enabled : bool
+ If True, applies additional coercions in Python before converting to Arrow.
+ This has performance penalties.
"""
- def __init__(self, timezone, safecheck):
+ def __init__(self, timezone, safecheck, int_to_decimal_coercion_enabled):
super(ArrowStreamPandasSerializer, self).__init__()
self._timezone = timezone
self._safecheck = safecheck
+ self._int_to_decimal_coercion_enabled = int_to_decimal_coercion_enabled
+
+ @staticmethod
+ def _apply_python_coercions(series, arrow_type):
+ """
+ Apply additional coercions to the series in Python before converting to Arrow:
+ - Convert integer series to decimal type.
+ When we have a pandas series of integers that needs to be converted to
+ pyarrow.decimal128 (with precision < 20), PyArrow fails with precision errors.
+ Explicitly cast to Decimal first.
+
+ Parameters
+ ----------
+ series : pandas.Series
+ The series to potentially convert
+ arrow_type : pyarrow.DataType
+ The target arrow type
+
+ Returns
+ -------
+ pandas.Series
+ The potentially converted pandas series
+ """
+ import pyarrow.types as types
+ import pandas as pd
+
+ # Convert integer series to Decimal objects
+ if (
+ types.is_decimal(arrow_type)
+ and series.dtype.kind in ["i", "u"] # integer types (signed/unsigned)
+ and not series.empty
+ ):
+ series = series.apply(lambda x: Decimal(x) if pd.notna(x) else None)
+
+ return series
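# Editorial sketch (not part of this patch): the failure mode the coercion above works
# around. Converting an integer pandas Series straight to a low-precision decimal128 may
# raise in PyArrow, while a Series of explicit Decimal objects converts cleanly.
from decimal import Decimal

import pandas as pd
import pyarrow as pa

ints = pd.Series([123, 456])
target = pa.decimal128(10, 2)
try:
    pa.Array.from_pandas(ints, type=target)  # may fail with a precision error
except pa.lib.ArrowException:
    pass
coerced = pd.Series([Decimal(int(v)) for v in ints])
pa.Array.from_pandas(coerced, type=target)  # Decimal objects convert as expected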
def arrow_to_pandas(
self, arrow_column, idx, struct_in_pandas="dict", ndarray_as_list=False, spark_type=None
@@ -264,20 +335,10 @@ def arrow_to_pandas(
# instead of creating datetime64[ns] as intermediate data to avoid overflow caused by
# datetime64[ns] type handling.
# Cast dates to objects instead of datetime64[ns] dtype to avoid overflow.
- pandas_options = {"date_as_object": True}
-
- import pyarrow as pa
-
- if LooseVersion(pa.__version__) >= LooseVersion("13.0.0"):
- # A legacy option to coerce date32, date64, duration, and timestamp
- # time units to nanoseconds when converting to pandas.
- # This option can only be added since 13.0.0.
- pandas_options.update(
- {
- "coerce_temporal_nanoseconds": True,
- }
- )
-
+ pandas_options = {
+ "date_as_object": True,
+ "coerce_temporal_nanoseconds": True,
+ }
s = arrow_column.to_pandas(**pandas_options)
# TODO(SPARK-43579): cache the converter for reuse
@@ -325,6 +386,9 @@ def _create_array(self, series, arrow_type, spark_type=None, arrow_cast=False):
)
series = conv(series)
+ if self._int_to_decimal_coercion_enabled:
+ series = self._apply_python_coercions(series, arrow_type)
+
if hasattr(series.array, "__arrow_array__"):
mask = None
else:
@@ -443,8 +507,11 @@ def __init__(
ndarray_as_list=False,
arrow_cast=False,
input_types=None,
+ int_to_decimal_coercion_enabled=False,
):
- super(ArrowStreamPandasUDFSerializer, self).__init__(timezone, safecheck)
+ super(ArrowStreamPandasUDFSerializer, self).__init__(
+ timezone, safecheck, int_to_decimal_coercion_enabled
+ )
self._assign_cols_by_name = assign_cols_by_name
self._df_for_struct = df_for_struct
self._struct_in_pandas = struct_in_pandas
@@ -653,15 +720,15 @@ def _create_array(self, arr, arrow_type, arrow_cast):
assert isinstance(arr, pa.Array)
assert isinstance(arrow_type, pa.DataType)
- # TODO: should we handle timezone here?
-
- try:
+ if arr.type == arrow_type:
return arr
- except pa.lib.ArrowException:
- if arrow_cast:
- return arr.cast(target_type=arrow_type, safe=self._safecheck)
- else:
- raise
+ elif arrow_cast:
+ return arr.cast(target_type=arrow_type, safe=self._safecheck)
+ else:
+ raise PySparkTypeError(
+ "Arrow UDFs require the return type to match the expected Arrow type. "
+ f"Expected: {arrow_type}, but got: {arr.type}."
+ )
def dump_stream(self, iterator, stream):
"""
@@ -695,12 +762,119 @@ def __repr__(self):
return "ArrowStreamArrowUDFSerializer"
+class ArrowBatchUDFSerializer(ArrowStreamArrowUDFSerializer):
+ """
+ Serializer used by Python worker to evaluate Arrow Python UDFs
+ when the legacy pandas conversion is disabled
+ (instead of legacy ArrowStreamPandasUDFSerializer).
+
+ Parameters
+ ----------
+ timezone : str
+ A timezone to respect when handling timestamp values
+ safecheck : bool
+ If True, conversion from Arrow to Pandas checks for overflow/truncation
+ input_types : list
+ List of input data types for the UDF
+ int_to_decimal_coercion_enabled : bool
+ If True, applies additional coercions in Python before converting to Arrow.
+ This has performance penalties.
+ """
+
+ def __init__(
+ self,
+ timezone,
+ safecheck,
+ input_types,
+ int_to_decimal_coercion_enabled=False,
+ ):
+ super().__init__(
+ timezone=timezone,
+ safecheck=safecheck,
+ assign_cols_by_name=False,
+ arrow_cast=True,
+ )
+ self._input_types = input_types
+ self._int_to_decimal_coercion_enabled = int_to_decimal_coercion_enabled
+
+ def load_stream(self, stream):
+ """
+ Loads a stream of Arrow record batches and converts them to Python values.
+
+ Parameters
+ ----------
+ stream : object
+ Input stream containing Arrow record batches
+
+ Yields
+ ------
+ list
+ List of columns, where each column is a list of Python values.
+ """
+ converters = [
+ ArrowTableToRowsConversion._create_converter(dt, none_on_identity=True)
+ for dt in self._input_types
+ ]
+
+ for batch in super().load_stream(stream):
+ columns = [
+ [conv(v) for v in column.to_pylist()] if conv is not None else column.to_pylist()
+ for column, conv in zip(batch.itercolumns(), converters)
+ ]
+ if len(columns) == 0:
+ yield [[pyspark._NoValue] * batch.num_rows]
+ else:
+ yield columns
+
+ def dump_stream(self, iterator, stream):
+ """
+ Dumps an iterator of Python values as a stream of Arrow record batches.
+
+ Parameters
+ ----------
+ iterator : iterator
+ Iterator yielding tuples of (data, arrow_type, spark_type) for single UDF
+ or list of tuples for multiple UDFs in a projection
+ stream : object
+ Output stream to write the Arrow record batches
+
+ Returns
+ -------
+ object
+ Result of writing the Arrow stream via ArrowStreamArrowUDFSerializer dump_stream
+ """
+ import pyarrow as pa
+
+ def create_array(results, arrow_type, spark_type):
+ conv = LocalDataToArrowConversion._create_converter(
+ spark_type,
+ none_on_identity=True,
+ int_to_decimal_coercion_enabled=self._int_to_decimal_coercion_enabled,
+ )
+ converted = [conv(res) for res in results] if conv is not None else results
+ try:
+ return pa.array(converted, type=arrow_type)
+ except pa.lib.ArrowInvalid:
+ return pa.array(converted).cast(target_type=arrow_type, safe=self._safecheck)
+
+ def py_to_batch():
+ for packed in iterator:
+ if len(packed) == 3 and isinstance(packed[1], pa.DataType):
+ # single array UDF in a projection
+ yield create_array(packed[0], packed[1], packed[2]), packed[1]
+ else:
+ # multiple array UDFs in a projection
+ yield [(create_array(*t), t[1]) for t in packed]
+
+ return super().dump_stream(py_to_batch(), stream)
+
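# Editorial sketch (not part of this patch): the two shapes py_to_batch above accepts from
# the iterator, illustrated with hypothetical values. A single UDF in a projection yields
# one (results, arrow_type, spark_type) tuple; multiple UDFs yield a list of such tuples.
import pyarrow as pa

from pyspark.sql.types import LongType, StringType

single_udf_item = ([1, 2, 3], pa.int64(), LongType())
multi_udf_item = [
    ([1, 2, 3], pa.int64(), LongType()),
    (["a", "b", "c"], pa.string(), StringType()),
]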
+
class ArrowStreamPandasUDTFSerializer(ArrowStreamPandasUDFSerializer):
"""
Serializer used by Python worker to evaluate Arrow-optimized Python UDTFs.
"""
- def __init__(self, timezone, safecheck):
+ def __init__(self, timezone, safecheck, input_types, int_to_decimal_coercion_enabled):
super(ArrowStreamPandasUDTFSerializer, self).__init__(
timezone=timezone,
safecheck=safecheck,
@@ -720,6 +894,9 @@ def __init__(self, timezone, safecheck):
ndarray_as_list=True,
# Enables explicit casting for mismatched return types of Arrow Python UDTFs.
arrow_cast=True,
+ input_types=input_types,
+ # Enable additional coercions for UDTF serialization
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
)
self._converter_map = dict()
@@ -742,35 +919,44 @@ def _create_batch(self, series):
import pandas as pd
import pyarrow as pa
- # Make input conform to [(series1, type1), (series2, type2), ...]
- if not isinstance(series, (list, tuple)) or (
- len(series) == 2 and isinstance(series[1], pa.DataType)
+ # Make input conform to
+ # [(series1, arrow_type1, spark_type1), (series2, arrow_type2, spark_type2), ...]
+ if (
+ not isinstance(series, (list, tuple))
+ or (len(series) == 2 and isinstance(series[1], pa.DataType))
+ or (
+ len(series) == 3
+ and isinstance(series[1], pa.DataType)
+ and isinstance(series[2], DataType)
+ )
):
series = [series]
series = ((s, None) if not isinstance(s, (list, tuple)) else s for s in series)
+ series = ((s[0], s[1], None) if len(s) == 2 else s for s in series)
arrs = []
- for s, t in series:
+ for s, arrow_type, spark_type in series:
if not isinstance(s, pd.DataFrame):
raise PySparkValueError(
"Output of an arrow-optimized Python UDTFs expects "
f"a pandas.DataFrame but got: {type(s)}"
)
- arrs.append(self._create_struct_array(s, t))
+ arrs.append(self._create_struct_array(s, arrow_type, spark_type))
return pa.RecordBatch.from_arrays(arrs, ["_%d" % i for i in range(len(arrs))])
def _get_or_create_converter_from_pandas(self, dt):
- if dt not in self._converter_map:
+ key = dt.json()
+ if key not in self._converter_map:
conv = _create_converter_from_pandas(
dt,
timezone=self._timezone,
error_on_duplicated_field_names=False,
ignore_unexpected_complex_type_values=True,
)
- self._converter_map[dt] = conv
- return self._converter_map[dt]
+ self._converter_map[key] = conv
+ return self._converter_map[key]
def _create_array(self, series, arrow_type, spark_type=None, arrow_cast=False):
"""
@@ -806,6 +992,9 @@ def _create_array(self, series, arrow_type, spark_type=None, arrow_cast=False):
conv = self._get_or_create_converter_from_pandas(dt)
series = conv(series)
+ if self._int_to_decimal_coercion_enabled:
+ series = self._apply_python_coercions(series, arrow_type)
+
if hasattr(series.array, "__arrow_array__"):
mask = None
else:
@@ -937,9 +1126,14 @@ def __init__(
state_object_schema,
arrow_max_records_per_batch,
prefers_large_var_types,
+ int_to_decimal_coercion_enabled,
):
super(ApplyInPandasWithStateSerializer, self).__init__(
- timezone, safecheck, assign_cols_by_name
+ timezone,
+ safecheck,
+ assign_cols_by_name,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
+ arrow_cast=True,
)
self.pickleSer = CPickleSerializer()
self.utf8_deserializer = UTF8Deserializer()
@@ -1307,9 +1501,20 @@ class TransformWithStateInPandasSerializer(ArrowStreamPandasUDFSerializer):
Limit of the number of records that can be written to a single ArrowRecordBatch in memory.
"""
- def __init__(self, timezone, safecheck, assign_cols_by_name, arrow_max_records_per_batch):
+ def __init__(
+ self,
+ timezone,
+ safecheck,
+ assign_cols_by_name,
+ arrow_max_records_per_batch,
+ int_to_decimal_coercion_enabled,
+ ):
super(TransformWithStateInPandasSerializer, self).__init__(
- timezone, safecheck, assign_cols_by_name
+ timezone,
+ safecheck,
+ assign_cols_by_name,
+ int_to_decimal_coercion_enabled=int_to_decimal_coercion_enabled,
+ arrow_cast=True,
)
self.arrow_max_records_per_batch = arrow_max_records_per_batch
self.key_offsets = None
@@ -1383,9 +1588,20 @@ class TransformWithStateInPandasInitStateSerializer(TransformWithStateInPandasSe
Same as input parameters in TransformWithStateInPandasSerializer.
"""
- def __init__(self, timezone, safecheck, assign_cols_by_name, arrow_max_records_per_batch):
+ def __init__(
+ self,
+ timezone,
+ safecheck,
+ assign_cols_by_name,
+ arrow_max_records_per_batch,
+ int_to_decimal_coercion_enabled,
+ ):
super(TransformWithStateInPandasInitStateSerializer, self).__init__(
- timezone, safecheck, assign_cols_by_name, arrow_max_records_per_batch
+ timezone,
+ safecheck,
+ assign_cols_by_name,
+ arrow_max_records_per_batch,
+ int_to_decimal_coercion_enabled,
)
self.init_key_offsets = None
@@ -1398,6 +1614,7 @@ def load_stream(self, stream):
def generate_data_batches(batches):
"""
Deserialize ArrowRecordBatches and return a generator of pandas.Series list.
+
The deserialization logic assumes that Arrow RecordBatches contain the data with the
ordering that data chunks for same grouping key will appear sequentially.
See `TransformWithStateInPandasPythonInitialStateRunner` for arrow batch schema sent
diff --git a/python/pyspark/sql/pandas/typehints.py b/python/pyspark/sql/pandas/typehints.py
index ba7801ceea559..f010489b95126 100644
--- a/python/pyspark/sql/pandas/typehints.py
+++ b/python/pyspark/sql/pandas/typehints.py
@@ -27,29 +27,23 @@
PandasGroupedAggUDFType,
ArrowScalarUDFType,
ArrowScalarIterUDFType,
+ ArrowGroupedAggUDFType,
)
-def infer_eval_type(
- sig: Signature, type_hints: Dict[str, Any]
-) -> Union[
- "PandasScalarUDFType",
- "PandasScalarIterUDFType",
- "PandasGroupedAggUDFType",
- "ArrowScalarUDFType",
- "ArrowScalarIterUDFType",
-]:
+def infer_pandas_eval_type(
+ sig: Signature,
+ type_hints: Dict[str, Any],
+) -> Optional[Union["PandasScalarUDFType", "PandasScalarIterUDFType", "PandasGroupedAggUDFType"]]:
"""
Infers the evaluation type in :class:`pyspark.util.PythonEvalType` from
:class:`inspect.Signature` instance and type hints.
"""
- from pyspark.sql.pandas.functions import PandasUDFType, ArrowUDFType
+ from pyspark.sql.pandas.functions import PandasUDFType
require_minimum_pandas_version()
- require_minimum_pyarrow_version()
import pandas as pd
- import pyarrow as pa
annotations = {}
for param in sig.parameters.values():
@@ -83,12 +77,8 @@ def infer_eval_type(
)
for a in parameters_sig
) and (return_annotation == pd.Series or return_annotation == pd.DataFrame)
-
- # pa.Array, ... -> pa.Array
- is_arrow_array = all(
- a == pa.Array or check_union_annotation(a, parameter_check_func=lambda na: na == pa.Array)
- for a in parameters_sig
- ) and (return_annotation == pa.Array)
+ if is_series_or_frame:
+ return PandasUDFType.SCALAR
# Iterator[Tuple[Series, Frame or Union[DataFrame, Series], ...] -> Iterator[Series or Frame]
is_iterator_tuple_series_or_frame = (
@@ -111,21 +101,8 @@ def infer_eval_type(
return_annotation, parameter_check_func=lambda a: a == pd.DataFrame or a == pd.Series
)
)
-
- # Iterator[Tuple[pa.Array, ...] -> Iterator[pa.Array]
- is_iterator_tuple_array = (
- len(parameters_sig) == 1
- and check_iterator_annotation( # Iterator
- parameters_sig[0],
- parameter_check_func=lambda a: check_tuple_annotation( # Tuple
- a,
- parameter_check_func=lambda ta: (ta == Ellipsis or ta == pa.Array),
- ),
- )
- and check_iterator_annotation(
- return_annotation, parameter_check_func=lambda a: a == pa.Array
- )
- )
+ if is_iterator_tuple_series_or_frame:
+ return PandasUDFType.SCALAR_ITER
# Iterator[Series, Frame or Union[DataFrame, Series]] -> Iterator[Series or Frame]
is_iterator_series_or_frame = (
@@ -144,18 +121,8 @@ def infer_eval_type(
return_annotation, parameter_check_func=lambda a: a == pd.DataFrame or a == pd.Series
)
)
-
- # Iterator[pa.Array] -> Iterator[pa.Array]
- is_iterator_array = (
- len(parameters_sig) == 1
- and check_iterator_annotation(
- parameters_sig[0],
- parameter_check_func=lambda a: (a == pd.Series or a == pa.Array),
- )
- and check_iterator_annotation(
- return_annotation, parameter_check_func=lambda a: a == pa.Array
- )
- )
+ if is_iterator_series_or_frame:
+ return PandasUDFType.SCALAR_ITER
# Series, Frame or Union[DataFrame, Series], ... -> Any
is_series_or_frame_agg = all(
@@ -174,23 +141,141 @@ def infer_eval_type(
and not check_iterator_annotation(return_annotation)
and not check_tuple_annotation(return_annotation)
)
+ if is_series_or_frame_agg:
+ return PandasUDFType.GROUPED_AGG
- if is_series_or_frame:
- return PandasUDFType.SCALAR
- elif is_arrow_array:
+ return None
+
+
+def infer_arrow_eval_type(
+ sig: Signature, type_hints: Dict[str, Any]
+) -> Optional[Union["ArrowScalarUDFType", "ArrowScalarIterUDFType", "ArrowGroupedAggUDFType"]]:
+ """
+ Infers the evaluation type in :class:`pyspark.util.PythonEvalType` from
+ :class:`inspect.Signature` instance and type hints.
+ """
+ from pyspark.sql.pandas.functions import ArrowUDFType
+
+ require_minimum_pyarrow_version()
+
+ import pyarrow as pa
+
+ annotations = {}
+ for param in sig.parameters.values():
+ if param.annotation is not param.empty:
+ annotations[param.name] = type_hints.get(param.name, param.annotation)
+
+ # Check if all arguments have type hints
+ parameters_sig = [
+ annotations[parameter] for parameter in sig.parameters if parameter in annotations
+ ]
+ if len(parameters_sig) != len(sig.parameters):
+ raise PySparkValueError(
+ errorClass="TYPE_HINT_SHOULD_BE_SPECIFIED",
+ messageParameters={"target": "all parameters", "sig": str(sig)},
+ )
+
+ # Check if the return has a type hint
+ return_annotation = type_hints.get("return", sig.return_annotation)
+ if sig.empty is return_annotation:
+ raise PySparkValueError(
+ errorClass="TYPE_HINT_SHOULD_BE_SPECIFIED",
+ messageParameters={"target": "the return type", "sig": str(sig)},
+ )
+
+ # pa.Array, ... -> pa.Array
+ is_arrow_array = all(a == pa.Array for a in parameters_sig) and (return_annotation == pa.Array)
+ if is_arrow_array:
return ArrowUDFType.SCALAR
- elif is_iterator_tuple_series_or_frame or is_iterator_series_or_frame:
- return PandasUDFType.SCALAR_ITER
- elif is_iterator_tuple_array or is_iterator_array:
+
+ # Iterator[Tuple[pa.Array, ...] -> Iterator[pa.Array]
+ is_iterator_tuple_array = (
+ len(parameters_sig) == 1
+ and check_iterator_annotation( # Iterator
+ parameters_sig[0],
+ parameter_check_func=lambda a: check_tuple_annotation( # Tuple
+ a,
+ parameter_check_func=lambda ta: (ta == Ellipsis or ta == pa.Array),
+ ),
+ )
+ and check_iterator_annotation(
+ return_annotation, parameter_check_func=lambda a: a == pa.Array
+ )
+ )
+ if is_iterator_tuple_array:
return ArrowUDFType.SCALAR_ITER
- elif is_series_or_frame_agg:
- return PandasUDFType.GROUPED_AGG
+
+ # Iterator[pa.Array] -> Iterator[pa.Array]
+ is_iterator_array = (
+ len(parameters_sig) == 1
+ and check_iterator_annotation(
+ parameters_sig[0],
+ parameter_check_func=lambda a: a == pa.Array,
+ )
+ and check_iterator_annotation(
+ return_annotation, parameter_check_func=lambda a: a == pa.Array
+ )
+ )
+ if is_iterator_array:
+ return ArrowUDFType.SCALAR_ITER
+
+ # pa.Array, ... -> Any
+ is_array_agg = all(a == pa.Array for a in parameters_sig) and (
+ return_annotation != pa.Array
+ and not check_iterator_annotation(return_annotation)
+ and not check_tuple_annotation(return_annotation)
+ )
+ if is_array_agg:
+ return ArrowUDFType.GROUPED_AGG
+
+ return None
+
+
+def infer_eval_type(
+ sig: Signature,
+ type_hints: Dict[str, Any],
+ kind: str = "all",
+) -> Union[
+ "PandasScalarUDFType",
+ "PandasScalarIterUDFType",
+ "PandasGroupedAggUDFType",
+ "ArrowScalarUDFType",
+ "ArrowScalarIterUDFType",
+ "ArrowGroupedAggUDFType",
+]:
+ """
+ Infers the evaluation type in :class:`pyspark.util.PythonEvalType` from
+ :class:`inspect.Signature` instance and type hints.
+ """
+ assert kind in ["pandas", "arrow", "all"], "kind should be either 'pandas', 'arrow' or 'all'"
+
+ eval_type: Optional[
+ Union[
+ "PandasScalarUDFType",
+ "PandasScalarIterUDFType",
+ "PandasGroupedAggUDFType",
+ "ArrowScalarUDFType",
+ "ArrowScalarIterUDFType",
+ "ArrowGroupedAggUDFType",
+ ]
+ ] = None
+ if kind == "pandas":
+ eval_type = infer_pandas_eval_type(sig, type_hints)
+ elif kind == "arrow":
+ eval_type = infer_arrow_eval_type(sig, type_hints)
else:
+ eval_type = infer_pandas_eval_type(sig, type_hints) or infer_arrow_eval_type(
+ sig, type_hints
+ )
+
+ if eval_type is None:
raise PySparkNotImplementedError(
errorClass="UNSUPPORTED_SIGNATURE",
messageParameters={"signature": str(sig)},
)
+ return eval_type
+
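# Editorial sketch (not part of this patch): hypothetical signatures and the Arrow eval
# types the inference above would assign, assuming the type hints are resolvable.
from typing import Iterator

import pyarrow as pa


def scalar_f(a: pa.Array, b: pa.Array) -> pa.Array:  # ArrowUDFType.SCALAR
    return pa.compute.add(a, b)


def scalar_iter_f(it: Iterator[pa.Array]) -> Iterator[pa.Array]:  # ArrowUDFType.SCALAR_ITER
    for arr in it:
        yield arr


def agg_f(v: pa.Array) -> float:  # ArrowUDFType.GROUPED_AGG
    return pa.compute.mean(v).as_py()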
def check_tuple_annotation(
annotation: Any, parameter_check_func: Optional[Callable[[Any], bool]] = None
diff --git a/python/pyspark/sql/pandas/types.py b/python/pyspark/sql/pandas/types.py
index 2f82609c84292..586d86aa6a535 100644
--- a/python/pyspark/sql/pandas/types.py
+++ b/python/pyspark/sql/pandas/types.py
@@ -37,6 +37,7 @@
StringType,
BinaryType,
DateType,
+ TimeType,
TimestampType,
TimestampNTZType,
DayTimeIntervalType,
@@ -127,6 +128,8 @@ def to_arrow_type(
arrow_type = pa.timestamp("us", tz=None)
elif type(dt) == DayTimeIntervalType:
arrow_type = pa.duration("us")
+ elif type(dt) == TimeType:
+ arrow_type = pa.time64("ns")
elif type(dt) == ArrayType:
field = pa.field(
"element",
@@ -302,6 +305,8 @@ def from_arrow_type(at: "pa.DataType", prefer_timestamp_ntz: bool = False) -> Da
spark_type = BinaryType()
elif types.is_date32(at):
spark_type = DateType()
+ elif types.is_time64(at):
+ spark_type = TimeType()
elif types.is_timestamp(at) and prefer_timestamp_ntz and at.tz is None:
spark_type = TimestampNTZType()
elif types.is_timestamp(at):
@@ -311,14 +316,6 @@ def from_arrow_type(at: "pa.DataType", prefer_timestamp_ntz: bool = False) -> Da
elif types.is_list(at):
spark_type = ArrayType(from_arrow_type(at.value_type, prefer_timestamp_ntz))
elif types.is_fixed_size_list(at):
- import pyarrow as pa
-
- if LooseVersion(pa.__version__) < LooseVersion("14.0.0"):
- # PyArrow versions before 14.0.0 do not support casting FixedSizeListArray to ListArray
- raise PySparkTypeError(
- errorClass="UNSUPPORTED_DATA_TYPE_FOR_ARROW_CONVERSION",
- messageParameters={"data_type": str(at)},
- )
spark_type = ArrayType(from_arrow_type(at.value_type, prefer_timestamp_ntz))
elif types.is_large_list(at):
spark_type = ArrayType(from_arrow_type(at.value_type, prefer_timestamp_ntz))
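# Editorial sketch (not part of this patch): the new TimeType branches above carry Spark
# TIME values as nanosecond-precision time64 in Arrow, and map time64 back to TimeType.
import datetime

import pyarrow as pa

arr = pa.array([datetime.time(12, 34, 56)], type=pa.time64("ns"))
assert pa.types.is_time64(arr.type)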
diff --git a/python/pyspark/sql/pandas/utils.py b/python/pyspark/sql/pandas/utils.py
index a351c13ff0a08..c37665c719c88 100644
--- a/python/pyspark/sql/pandas/utils.py
+++ b/python/pyspark/sql/pandas/utils.py
@@ -22,7 +22,7 @@
def require_minimum_pandas_version() -> None:
"""Raise ImportError if minimum version of Pandas is not installed"""
# TODO(HyukjinKwon): Relocate and deduplicate the version specification.
- minimum_pandas_version = "2.0.0"
+ minimum_pandas_version = "2.2.0"
try:
import pandas
@@ -61,7 +61,7 @@ def require_minimum_pandas_version() -> None:
def require_minimum_pyarrow_version() -> None:
"""Raise ImportError if minimum version of pyarrow is not installed"""
# TODO(HyukjinKwon): Relocate and deduplicate the version specification.
- minimum_pyarrow_version = "11.0.0"
+ minimum_pyarrow_version = "15.0.0"
import os
@@ -98,7 +98,7 @@ def require_minimum_pyarrow_version() -> None:
def require_minimum_numpy_version() -> None:
"""Raise ImportError if minimum version of NumPy is not installed"""
- minimum_numpy_version = "1.21"
+ minimum_numpy_version = "1.22"
try:
import numpy
diff --git a/python/pyspark/sql/session.py b/python/pyspark/sql/session.py
index 241424c954b2d..2cb0f2f59b1b9 100644
--- a/python/pyspark/sql/session.py
+++ b/python/pyspark/sql/session.py
@@ -54,6 +54,7 @@
DataType,
StructField,
StructType,
+ VariantVal,
_make_type_verifier,
_infer_schema,
_has_nulltype,
@@ -1194,10 +1195,14 @@ def _createFromLocal(
if not isinstance(data, list):
data = list(data)
+ if any(isinstance(d, VariantVal) for d in data):
+ raise PySparkValueError("Rows cannot be of type VariantVal")
+
+ tupled_data: Iterable[Tuple]
if schema is None or isinstance(schema, (list, tuple)):
struct = self._inferSchemaFromList(data, names=schema)
converter = _create_converter(struct)
- tupled_data: Iterable[Tuple] = map(converter, data)
+ tupled_data = map(converter, data)
if isinstance(schema, (list, tuple)):
for i, name in enumerate(schema):
struct.fields[i].name = name
@@ -1205,7 +1210,8 @@ def _createFromLocal(
elif isinstance(schema, StructType):
struct = schema
- tupled_data = data
+ converter = _create_converter(struct)
+ tupled_data = map(converter, data)
else:
raise PySparkTypeError(
diff --git a/python/pyspark/sql/streaming/readwriter.py b/python/pyspark/sql/streaming/readwriter.py
index 34af8cd9b070e..8121dd609950e 100644
--- a/python/pyspark/sql/streaming/readwriter.py
+++ b/python/pyspark/sql/streaming/readwriter.py
@@ -1549,7 +1549,7 @@ def foreach(self, f: Union[Callable[[Row], None], "SupportsProcess"]) -> "DataSt
... def close(self, error):
... print("Closed with error: %s" % str(error))
...
- >>> q = df.writeStream.foreach(print_row).start()
+ >>> q = df.writeStream.foreach(RowPrinter()).start()
>>> time.sleep(3)
>>> q.stop()
"""
diff --git a/python/pyspark/sql/streaming/stateful_processor_api_client.py b/python/pyspark/sql/streaming/stateful_processor_api_client.py
index 145e24ea2cd19..65e58e025b171 100644
--- a/python/pyspark/sql/streaming/stateful_processor_api_client.py
+++ b/python/pyspark/sql/streaming/stateful_processor_api_client.py
@@ -494,26 +494,34 @@ def _receive_str(self) -> str:
def _serialize_to_bytes(self, schema: StructType, data: Tuple) -> bytes:
from pyspark.testing.utils import have_numpy
- converted = []
-
if have_numpy:
import numpy as np
- # In order to convert NumPy types to Python primitive types.
- for v in data:
+ def normalize_value(v: Any) -> Any:
+ # Convert NumPy types to Python primitive types.
if isinstance(v, np.generic):
- converted.append(v.tolist())
+ return v.tolist()
+ # List / tuple: recursively normalize each element
+ if isinstance(v, (list, tuple)):
+ return type(v)(normalize_value(e) for e in v)
+ # Dict: normalize both keys and values
+ if isinstance(v, dict):
+ return {normalize_value(k): normalize_value(val) for k, val in v.items()}
# Address a couple of pandas dtypes too.
elif hasattr(v, "to_pytimedelta"):
- converted.append(v.to_pytimedelta())
+ return v.to_pytimedelta()
elif hasattr(v, "to_pydatetime"):
- converted.append(v.to_pydatetime())
+ return v.to_pydatetime()
else:
- converted.append(v)
+ return v
+
+ converted = [normalize_value(v) for v in data]
else:
converted = list(data)
- row_value = Row(*converted)
+ field_names = [f.name for f in schema.fields]
+ row_value = Row(**dict(zip(field_names, converted)))
+
return self.pickleSer.dumps(schema.toInternal(row_value))
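# Editorial sketch (not part of this patch): constructing the Row by keyword ties each
# converted value to its schema field name instead of relying on an anonymous positional
# tuple. Field names here are hypothetical.
from pyspark.sql import Row

field_names = ["user", "age"]
converted = ["alice", 3]
row_value = Row(**dict(zip(field_names, converted)))
assert row_value.user == "alice" and row_value.age == 3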
def _deserialize_from_bytes(self, value: bytes) -> Any:
diff --git a/python/pyspark/sql/tests/arrow/test_arrow.py b/python/pyspark/sql/tests/arrow/test_arrow.py
index 5a770a947889b..c74ca121f26d3 100644
--- a/python/pyspark/sql/tests/arrow/test_arrow.py
+++ b/python/pyspark/sql/tests/arrow/test_arrow.py
@@ -707,8 +707,8 @@ def check_createDataFrame_with_single_data_type(self):
def test_createDataFrame_does_not_modify_input(self):
# Some series get converted for Spark to consume, this makes sure input is unchanged
pdf = self.create_pandas_data_frame()
- # Use a nanosecond value to make sure it is not truncated
- pdf.iloc[0, 7] = pd.Timestamp(1)
+ # Use a nanosecond value that converts to microseconds without precision loss
+ pdf.iloc[0, 7] = pd.Timestamp(1000)
# Integers with nulls will get NaNs filled with 0 and will be casted
pdf.iloc[1, 1] = None
pdf_copy = pdf.copy(deep=True)
@@ -1713,13 +1713,8 @@ def test_createDataFrame_arrow_fixed_size_binary(self):
def test_createDataFrame_arrow_fixed_size_list(self):
a = pa.array([[-1, 3]] * 5, type=pa.list_(pa.int32(), 2))
t = pa.table([a], ["fsl"])
- if LooseVersion(pa.__version__) < LooseVersion("14.0.0"):
- # PyArrow versions before 14.0.0 do not support casting FixedSizeListArray to ListArray
- with self.assertRaises(PySparkTypeError):
- df = self.spark.createDataFrame(t)
- else:
- df = self.spark.createDataFrame(t)
- self.assertIsInstance(df.schema["fsl"].dataType, ArrayType)
+ df = self.spark.createDataFrame(t)
+ self.assertIsInstance(df.schema["fsl"].dataType, ArrayType)
@unittest.skipIf(
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_python_udf.py b/python/pyspark/sql/tests/arrow/test_arrow_python_udf.py
index 78e72e02836f9..a054261304c6f 100644
--- a/python/pyspark/sql/tests/arrow/test_arrow_python_udf.py
+++ b/python/pyspark/sql/tests/arrow/test_arrow_python_udf.py
@@ -21,7 +21,7 @@
from pyspark.sql import Row
from pyspark.sql.functions import udf
from pyspark.sql.tests.test_udf import BaseUDFTestsMixin
-from pyspark.sql.types import VarcharType
+from pyspark.sql.types import DayTimeIntervalType, VarcharType, StructType, StructField, StringType
from pyspark.testing.sqlutils import (
have_pandas,
have_pyarrow,
@@ -180,6 +180,61 @@ def test_type_coercion_string_to_numeric(self):
with self.assertRaises(PythonException):
df_floating_value.select(udf(lambda x: x, "decimal")("value").alias("res")).collect()
+ def test_arrow_udf_int_to_decimal_coercion(self):
+ from decimal import Decimal
+
+ with self.sql_conf(
+ {"spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled": False}
+ ):
+ df = self.spark.range(0, 3)
+
+ @udf(returnType="decimal(10,2)", useArrow=True)
+ def int_to_decimal_udf(val):
+ values = [123, 456, 789]
+ return values[int(val) % len(values)]
+
+ # Test with coercion enabled
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ result = df.select(int_to_decimal_udf("id").alias("decimal_val")).collect()
+ self.assertEqual(result[0]["decimal_val"], Decimal("123.00"))
+ self.assertEqual(result[1]["decimal_val"], Decimal("456.00"))
+ self.assertEqual(result[2]["decimal_val"], Decimal("789.00"))
+
+ # Test with coercion disabled (should fail)
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": False}
+ ):
+ with self.assertRaisesRegex(
+ PythonException, "An exception was thrown from the Python worker"
+ ):
+ df.select(int_to_decimal_udf("id").alias("decimal_val")).collect()
+
+ @udf(returnType="decimal(25,1)", useArrow=True)
+ def high_precision_udf(val):
+ values = [1, 2, 3]
+ return values[int(val) % len(values)]
+
+ # Test high precision decimal with coercion enabled
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ result = df.select(high_precision_udf("id").alias("decimal_val")).collect()
+ self.assertEqual(len(result), 3)
+ self.assertEqual(result[0]["decimal_val"], Decimal("1.0"))
+ self.assertEqual(result[1]["decimal_val"], Decimal("2.0"))
+ self.assertEqual(result[2]["decimal_val"], Decimal("3.0"))
+
+ # Test high precision decimal with coercion disabled (should fail)
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": False}
+ ):
+ with self.assertRaisesRegex(
+ PythonException, "An exception was thrown from the Python worker"
+ ):
+ df.select(high_precision_udf("id").alias("decimal_val")).collect()
+
def test_err_return_type(self):
with self.assertRaises(PySparkNotImplementedError) as pe:
udf(lambda x: x, VarcharType(10), useArrow=True)
@@ -243,6 +298,88 @@ def test_udf_use_arrow_and_session_conf(self):
udf(lambda x: str(x), useArrow=False).evalType, PythonEvalType.SQL_BATCHED_UDF
)
+ def test_day_time_interval_type_casting(self):
+ """Test that DayTimeIntervalType UDFs work with Arrow and preserve field specifications."""
+
+ # HOUR TO SECOND
+ @udf(useArrow=True, returnType=DayTimeIntervalType(1, 3))
+ def return_interval(x):
+ return x
+
+ # UDF input: HOUR TO SECOND, UDF output: HOUR TO SECOND
+ df = self.spark.sql("SELECT INTERVAL '200:13:50.3' HOUR TO SECOND as value").select(
+ return_interval("value").alias("result")
+ )
+ self.assertEqual(df.schema.fields[0].dataType, DayTimeIntervalType(1, 3))
+ self.assertIsNotNone(df.collect()[0]["result"])
+
+ # UDF input: DAY TO SECOND, UDF output: HOUR TO SECOND
+ df2 = self.spark.sql("SELECT INTERVAL '1 10:30:45.123' DAY TO SECOND as value").select(
+ return_interval("value").alias("result")
+ )
+ self.assertEqual(df2.schema.fields[0].dataType, DayTimeIntervalType(1, 3))
+ self.assertIsNotNone(df2.collect()[0]["result"])
+
+ def test_day_time_interval_in_struct(self):
+ """Test that DayTimeIntervalType works within StructType with Arrow UDFs."""
+
+ struct_type = StructType(
+ [
+ StructField("interval_field", DayTimeIntervalType(1, 3)),
+ StructField("name", StringType()),
+ ]
+ )
+
+ @udf(useArrow=True, returnType=struct_type)
+ def create_struct_with_interval(interval_val, name_val):
+ return Row(interval_field=interval_val, name=name_val)
+
+ df = self.spark.sql(
+ """
+ SELECT INTERVAL '15:30:45.678' HOUR TO SECOND as interval_val,
+ 'test_name' as name_val
+ """
+ ).select(create_struct_with_interval("interval_val", "name_val").alias("result"))
+
+ self.assertEqual(df.schema.fields[0].dataType, struct_type)
+ self.assertEqual(df.schema.fields[0].dataType.fields[0].dataType, DayTimeIntervalType(1, 3))
+ result = df.collect()[0]["result"]
+ self.assertIsNotNone(result["interval_field"])
+ self.assertEqual(result["name"], "test_name")
+
+
+@unittest.skipIf(
+ not have_pandas or not have_pyarrow, pandas_requirement_message or pyarrow_requirement_message
+)
+class ArrowPythonUDFLegacyTestsMixin(ArrowPythonUDFTestsMixin):
+ @classmethod
+ def setUpClass(cls):
+ super().setUpClass()
+ cls.spark.conf.set("spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled", "true")
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled")
+ finally:
+ super().tearDownClass()
+
+
+class ArrowPythonUDFNonLegacyTestsMixin(ArrowPythonUDFTestsMixin):
+ @classmethod
+ def setUpClass(cls):
+ super().setUpClass()
+ cls.spark.conf.set(
+ "spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled", "false"
+ )
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled")
+ finally:
+ super().tearDownClass()
+
class ArrowPythonUDFTests(ArrowPythonUDFTestsMixin, ReusedSQLTestCase):
@classmethod
@@ -258,18 +395,32 @@ def tearDownClass(cls):
super(ArrowPythonUDFTests, cls).tearDownClass()
-class AsyncArrowPythonUDFTests(ArrowPythonUDFTests):
+class ArrowPythonUDFLegacyTests(ArrowPythonUDFLegacyTestsMixin, ReusedSQLTestCase):
+ @classmethod
+ def setUpClass(cls):
+ super(ArrowPythonUDFLegacyTests, cls).setUpClass()
+ cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.enabled", "true")
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.execution.pythonUDF.arrow.enabled")
+ finally:
+ super(ArrowPythonUDFLegacyTests, cls).tearDownClass()
+
+
+class ArrowPythonUDFNonLegacyTests(ArrowPythonUDFNonLegacyTestsMixin, ReusedSQLTestCase):
@classmethod
def setUpClass(cls):
- super(AsyncArrowPythonUDFTests, cls).setUpClass()
- cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.concurrency.level", "4")
+ super(ArrowPythonUDFNonLegacyTests, cls).setUpClass()
+ cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.enabled", "true")
@classmethod
def tearDownClass(cls):
try:
- cls.spark.conf.unset("spark.sql.execution.pythonUDF.arrow.concurrency.level")
+ cls.spark.conf.unset("spark.sql.execution.pythonUDF.arrow.enabled")
finally:
- super(AsyncArrowPythonUDFTests, cls).tearDownClass()
+ super(ArrowPythonUDFNonLegacyTests, cls).tearDownClass()
if __name__ == "__main__":
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_udf.py b/python/pyspark/sql/tests/arrow/test_arrow_udf.py
index 052ee1c3be830..693d7ba484d80 100644
--- a/python/pyspark/sql/tests/arrow/test_arrow_udf.py
+++ b/python/pyspark/sql/tests/arrow/test_arrow_udf.py
@@ -15,12 +15,13 @@
# limitations under the License.
#
+import os
+import time
import unittest
import datetime
-# TODO: import arrow_udf from public API
-from pyspark.sql.pandas.functions import arrow_udf, ArrowUDFType, PandasUDFType
-from pyspark.sql import functions as F
+from pyspark.sql.functions import arrow_udf, ArrowUDFType, PandasUDFType
+from pyspark.sql import functions as F, Row
from pyspark.sql.types import (
DoubleType,
StructType,
@@ -98,6 +99,65 @@ def foo(x):
self.assertEqual(foo.returnType, DoubleType())
self.assertEqual(foo.evalType, PythonEvalType.SQL_SCALAR_ARROW_UDF)
+ def test_time_zone_against_map_in_arrow(self):
+ import pyarrow as pa
+
+ for tz in [
+ "Asia/Shanghai",
+ "Asia/Hong_Kong",
+ "America/Los_Angeles",
+ "Pacific/Honolulu",
+ "Europe/Amsterdam",
+ "US/Pacific",
+ ]:
+ with self.sql_conf({"spark.sql.session.timeZone": tz}):
+ # There is a time-zone conversion in df.collect:
+ # ts.astimezone().replace(tzinfo=None)
+ # which is controlled by the environment variable os.environ["TZ"].
+ # Note that if the env is not equivalent to spark.sql.session.timeZone,
+ # then there is a mismatch between the internal arrow data and df.collect.
+ os.environ["TZ"] = tz
+ time.tzset()
+
+ df = self.spark.sql("SELECT TIMESTAMP('2019-04-12 15:50:01') AS ts")
+
+ def check_value(t):
+ assert isinstance(t, pa.Array)
+ assert isinstance(t, pa.TimestampArray)
+ assert isinstance(t[0], pa.Scalar)
+ assert isinstance(t[0], pa.TimestampScalar)
+ ts = t[0].as_py()
+ assert isinstance(ts, datetime.datetime)
+ assert ts.year == 2019
+ assert ts.month == 4
+ assert ts.day == 12
+ assert ts.hour == 15
+ assert ts.minute == 50
+ assert ts.second == 1
+ # the timezone is still kept in the internal arrow data
+ assert ts.tzinfo is not None
+ assert str(ts.tzinfo) == tz, str(ts.tzinfo)
+
+ @arrow_udf("timestamp")
+ def identity(t):
+ check_value(t)
+ return t
+
+ expected = [Row(ts=datetime.datetime(2019, 4, 12, 15, 50, 1))]
+ self.assertEqual(expected, df.collect())
+
+ result1 = df.select(identity("ts").alias("ts"))
+ self.assertEqual(expected, result1.collect())
+
+ def identity2(iter):
+ for batch in iter:
+ t = batch["ts"]
+ check_value(t)
+ yield batch
+
+ result2 = df.mapInArrow(identity2, "ts timestamp")
+ self.assertEqual(expected, result2.collect())
+
def test_arrow_udf_wrong_arg(self):
with self.quiet():
with self.assertRaises(ParseException):
@@ -166,6 +226,13 @@ def foo(df):
def zero_with_type():
return 1
+ with self.assertRaisesRegex(ValueError, "0-arg arrow_udfs.*not.*supported"):
+
+ @arrow_udf(LongType(), ArrowUDFType.SCALAR_ITER)
+ def zero_with_type():
+ yield 1
+ yield 2
+
def test_arrow_udf_timestamp_ntz(self):
import pyarrow as pa
@@ -207,7 +274,10 @@ def noop(s: pa.Array) -> pa.Array:
class ArrowUDFTests(ArrowUDFTestsMixin, ReusedSQLTestCase):
- pass
+ def setUp(self):
+ tz = "America/Los_Angeles"
+ os.environ["TZ"] = tz
+ time.tzset()
if __name__ == "__main__":
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_udf_grouped_agg.py b/python/pyspark/sql/tests/arrow/test_arrow_udf_grouped_agg.py
new file mode 100644
index 0000000000000..3545801c4b5aa
--- /dev/null
+++ b/python/pyspark/sql/tests/arrow/test_arrow_udf_grouped_agg.py
@@ -0,0 +1,883 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import unittest
+
+from pyspark.sql.functions import arrow_udf, ArrowUDFType
+from pyspark.util import PythonEvalType
+from pyspark.sql import Row
+from pyspark.sql.types import ArrayType, YearMonthIntervalType
+from pyspark.sql import functions as sf
+from pyspark.errors import AnalysisException, PythonException
+from pyspark.testing.sqlutils import (
+ ReusedSQLTestCase,
+ have_pyarrow,
+ pyarrow_requirement_message,
+)
+
+
+@unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+class GroupedAggArrowUDFTestsMixin:
+ @property
+ def data(self):
+ return (
+ self.spark.range(10)
+ .toDF("id")
+ .withColumn("vs", sf.array([sf.lit(i * 1.0) + sf.col("id") for i in range(20, 30)]))
+ .withColumn("v", sf.explode(sf.col("vs")))
+ .drop("vs")
+ .withColumn("w", sf.lit(1.0))
+ )
+
+ @property
+ def python_plus_one(self):
+ @sf.udf("double")
+ def plus_one(v):
+ assert isinstance(v, (int, float))
+ return float(v + 1)
+
+ return plus_one
+
+ @property
+ def arrow_scalar_plus_two(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.SCALAR)
+ def plus_two(v):
+ assert isinstance(v, pa.Array)
+ return pa.compute.add(v, 2).cast(pa.float64())
+
+ return plus_two
+
+ @property
+ def arrow_agg_mean_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def avg(v):
+ assert isinstance(v, pa.Array)
+ return pa.compute.mean(v.cast(pa.float64()))
+
+ return avg
+
+ @property
+ def arrow_agg_mean_arr_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("array<double>", ArrowUDFType.GROUPED_AGG)
+ def avg(v):
+ assert isinstance(v, pa.Array)
+ assert isinstance(v, pa.ListArray)
+ return [pa.compute.mean(v.flatten()).cast(pa.float64())]
+
+ return avg
+
+ @property
+ def arrow_agg_sum_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def sum(v):
+ assert isinstance(v, pa.Array)
+ return pa.compute.sum(v).cast(pa.float64())
+
+ return sum
+
+ @property
+ def arrow_agg_weighted_mean_udf(self):
+ import pyarrow as pa
+ import numpy as np
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def weighted_mean(v, w):
+ assert isinstance(v, pa.Array)
+ assert isinstance(w, pa.Array)
+ return float(np.average(v, weights=w))
+
+ return weighted_mean
+
+ def test_manual(self):
+ df = self.data
+ sum_udf = self.arrow_agg_sum_udf
+ mean_udf = self.arrow_agg_mean_udf
+ mean_arr_udf = self.arrow_agg_mean_arr_udf
+
+ result = (
+ df.groupby("id")
+ .agg(sum_udf(df.v), mean_udf(df.v), mean_arr_udf(sf.array(df.v)))
+ .sort("id")
+ )
+ expected = self.spark.createDataFrame(
+ [
+ [0, 245.0, 24.5, [24.5]],
+ [1, 255.0, 25.5, [25.5]],
+ [2, 265.0, 26.5, [26.5]],
+ [3, 275.0, 27.5, [27.5]],
+ [4, 285.0, 28.5, [28.5]],
+ [5, 295.0, 29.5, [29.5]],
+ [6, 305.0, 30.5, [30.5]],
+ [7, 315.0, 31.5, [31.5]],
+ [8, 325.0, 32.5, [32.5]],
+ [9, 335.0, 33.5, [33.5]],
+ ],
+ ["id", "sum(v)", "avg(v)", "avg(array(v))"],
+ ).collect()
+
+ self.assertEqual(expected, result.collect())
+
+ def test_basic(self):
+ df = self.data
+ weighted_mean_udf = self.arrow_agg_weighted_mean_udf
+
+ # Groupby one column and aggregate one UDF with literal
+ result1 = df.groupby("id").agg(weighted_mean_udf(df.v, sf.lit(1.0))).sort("id")
+ expected1 = (
+ df.groupby("id").agg(sf.mean(df.v).alias("weighted_mean(v, 1.0)")).sort("id").collect()
+ )
+ self.assertEqual(expected1, result1.collect())
+
+ # Groupby one expression and aggregate one UDF with literal
+ result2 = (
+ df.groupby((sf.col("id") + 1)).agg(weighted_mean_udf(df.v, sf.lit(1.0))).sort(df.id + 1)
+ )
+ expected2 = (
+ df.groupby((sf.col("id") + 1))
+ .agg(sf.mean(df.v).alias("weighted_mean(v, 1.0)"))
+ .sort(df.id + 1)
+ ).collect()
+ self.assertEqual(expected2, result2.collect())
+
+ # Groupby one column and aggregate one UDF without literal
+ result3 = df.groupby("id").agg(weighted_mean_udf(df.v, df.w)).sort("id")
+ expected3 = (
+ df.groupby("id").agg(sf.mean(df.v).alias("weighted_mean(v, w)")).sort("id").collect()
+ )
+ self.assertEqual(expected3, result3.collect())
+
+ # Groupby one expression and aggregate one UDF without literal
+ result4 = (
+ df.groupby((sf.col("id") + 1).alias("id")).agg(weighted_mean_udf(df.v, df.w)).sort("id")
+ )
+ expected4 = (
+ df.groupby((sf.col("id") + 1).alias("id"))
+ .agg(sf.mean(df.v).alias("weighted_mean(v, w)"))
+ .sort("id")
+ ).collect()
+ self.assertEqual(expected4, result4.collect())
+
+ def test_alias(self):
+ df = self.data
+ mean_udf = self.arrow_agg_mean_udf
+
+ result = df.groupby("id").agg(mean_udf(df.v).alias("mean_alias"))
+ expected = df.groupby("id").agg(sf.mean(df.v).alias("mean_alias")).collect()
+
+ self.assertEqual(expected, result.collect())
+
+ def test_mixed_sql(self):
+ """
+ Test mixing group aggregate Arrow UDF with sql expression.
+ """
+ df = self.data
+ sum_udf = self.arrow_agg_sum_udf
+
+ # Mix group aggregate Arrow UDF with sql expression
+ result1 = df.groupby("id").agg(sum_udf(df.v) + 1).sort("id")
+ expected1 = df.groupby("id").agg(sf.sum(df.v) + 1).sort("id").collect()
+
+ # Mix group aggregate Arrow UDF with sql expression (order swapped)
+ result2 = df.groupby("id").agg(sum_udf(df.v + 1)).sort("id")
+
+ expected2 = df.groupby("id").agg(sf.sum(df.v + 1)).sort("id").collect()
+
+ # Wrap group aggregate Arrow UDF with two sql expressions
+ result3 = df.groupby("id").agg(sum_udf(df.v + 1) + 2).sort("id")
+ expected3 = df.groupby("id").agg(sf.sum(df.v + 1) + 2).sort("id").collect()
+
+ self.assertEqual(expected1, result1.collect())
+ self.assertEqual(expected2, result2.collect())
+ self.assertEqual(expected3, result3.collect())
+
+ def test_mixed_udfs(self):
+ """
+ Test mixing group aggregate Arrow UDF with python UDF and scalar Arrow UDF.
+ """
+ df = self.data
+ plus_one = self.python_plus_one
+ plus_two = self.arrow_scalar_plus_two
+ sum_udf = self.arrow_agg_sum_udf
+
+ # Mix group aggregate Arrow UDF and python UDF
+ result1 = df.groupby("id").agg(plus_one(sum_udf(df.v))).sort("id")
+ expected1 = df.groupby("id").agg(plus_one(sf.sum(df.v))).sort("id").collect()
+
+ # Mix group aggregate Arrow UDF and python UDF (order swapped)
+ result2 = df.groupby("id").agg(sum_udf(plus_one(df.v))).sort("id")
+ expected2 = df.groupby("id").agg(sf.sum(plus_one(df.v))).sort("id").collect()
+
+ # Mix group aggregate Arrow UDF and scalar Arrow UDF
+ result3 = df.groupby("id").agg(sum_udf(plus_two(df.v))).sort("id")
+ expected3 = df.groupby("id").agg(sf.sum(plus_two(df.v))).sort("id").collect()
+
+ # Mix group aggregate Arrow UDF and scalar Arrow UDF (order swapped)
+ result4 = df.groupby("id").agg(plus_two(sum_udf(df.v))).sort("id")
+ expected4 = df.groupby("id").agg(plus_two(sf.sum(df.v))).sort("id").collect()
+
+ # Wrap group aggregate Arrow UDF with two python UDFs and use python UDF in groupby
+ result5 = (
+ df.groupby(plus_one(df.id)).agg(plus_one(sum_udf(plus_one(df.v)))).sort("plus_one(id)")
+ )
+ expected5 = (
+ df.groupby(plus_one(df.id)).agg(plus_one(sf.sum(plus_one(df.v)))).sort("plus_one(id)")
+ ).collect()
+
+ # Wrap group aggregate Arrow UDF with two scalar Arrow UDFs and use a scalar Arrow UDF
+ # in the groupby
+ result6 = (
+ df.groupby(plus_two(df.id)).agg(plus_two(sum_udf(plus_two(df.v)))).sort("plus_two(id)")
+ )
+ expected6 = (
+ df.groupby(plus_two(df.id)).agg(plus_two(sf.sum(plus_two(df.v)))).sort("plus_two(id)")
+ ).collect()
+
+ self.assertEqual(expected1, result1.collect())
+ self.assertEqual(expected2, result2.collect())
+ self.assertEqual(expected3, result3.collect())
+ self.assertEqual(expected4, result4.collect())
+ self.assertEqual(expected5, result5.collect())
+ self.assertEqual(expected6, result6.collect())
+
+ def test_multiple_udfs(self):
+ """
+ Test multiple group aggregate Arrow UDFs in one agg function.
+ """
+ df = self.data
+ mean_udf = self.arrow_agg_mean_udf
+ sum_udf = self.arrow_agg_sum_udf
+ weighted_mean_udf = self.arrow_agg_weighted_mean_udf
+
+ result = (
+ df.groupBy("id")
+ .agg(mean_udf(df.v), sum_udf(df.v), weighted_mean_udf(df.v, df.w))
+ .sort("id")
+ )
+ expected = (
+ df.groupBy("id")
+ .agg(sf.mean(df.v), sf.sum(df.v), sf.mean(df.v).alias("weighted_mean(v, w)"))
+ .sort("id")
+ .collect()
+ )
+
+ self.assertEqual(expected, result.collect())
+
+ def test_complex_groupby(self):
+ df = self.data
+ sum_udf = self.arrow_agg_sum_udf
+ plus_one = self.python_plus_one
+ plus_two = self.arrow_scalar_plus_two
+
+ # groupby one expression
+ result1 = df.groupby(df.v % 2).agg(sum_udf(df.v))
+ expected1 = df.groupby(df.v % 2).agg(sf.sum(df.v)).collect()
+
+ # empty groupby
+ result2 = df.groupby().agg(sum_udf(df.v))
+ expected2 = df.groupby().agg(sf.sum(df.v)).collect()
+
+ # groupby one column and one sql expression
+ result3 = df.groupby(df.id, df.v % 2).agg(sum_udf(df.v)).orderBy(df.id, df.v % 2)
+ expected3 = df.groupby(df.id, df.v % 2).agg(sf.sum(df.v)).orderBy(df.id, df.v % 2).collect()
+
+ # groupby one python UDF
+ result4 = df.groupby(plus_one(df.id)).agg(sum_udf(df.v)).sort("plus_one(id)")
+ expected4 = df.groupby(plus_one(df.id)).agg(sf.sum(df.v)).sort("plus_one(id)").collect()
+
+ # groupby one scalar Arrow UDF
+ result5 = df.groupby(plus_two(df.id)).agg(sum_udf(df.v)).sort("sum(v)")
+ expected5 = df.groupby(plus_two(df.id)).agg(sf.sum(df.v)).sort("sum(v)").collect()
+
+ # groupby one expression and one python UDF
+ result6 = (
+ df.groupby(df.v % 2, plus_one(df.id))
+ .agg(sum_udf(df.v))
+ .sort(["(v % 2)", "plus_one(id)"])
+ )
+ expected6 = (
+ df.groupby(df.v % 2, plus_one(df.id))
+ .agg(sf.sum(df.v))
+ .sort(["(v % 2)", "plus_one(id)"])
+ ).collect()
+
+ # groupby one expression and one scalar pandas UDF
+ result7 = (
+ df.groupby(df.v % 2, plus_two(df.id))
+ .agg(sum_udf(df.v))
+ .sort(["sum(v)", "plus_two(id)"])
+ )
+ expected7 = (
+ df.groupby(df.v % 2, plus_two(df.id)).agg(sf.sum(df.v)).sort(["sum(v)", "plus_two(id)"])
+ ).collect()
+
+ self.assertEqual(expected1, result1.collect())
+ self.assertEqual(expected2, result2.collect())
+ self.assertEqual(expected3, result3.collect())
+ self.assertEqual(expected4, result4.collect())
+ self.assertEqual(expected5, result5.collect())
+ self.assertEqual(expected6, result6.collect())
+ self.assertEqual(expected7, result7.collect())
+
+ def test_complex_expressions(self):
+ df = self.data
+ plus_one = self.python_plus_one
+ plus_two = self.arrow_scalar_plus_two
+ sum_udf = self.arrow_agg_sum_udf
+
+ # Test complex expressions with sql expression, python UDF and
+ # group aggregate pandas UDF
+ result1 = (
+ df.withColumn("v1", plus_one(df.v))
+ .withColumn("v2", df.v + 2)
+ .groupby(df.id, df.v % 2)
+ .agg(
+ sum_udf(sf.col("v")),
+ sum_udf(sf.col("v1") + 3),
+ sum_udf(sf.col("v2")) + 5,
+ plus_one(sum_udf(sf.col("v1"))),
+ sum_udf(plus_one(sf.col("v2"))),
+ )
+ .sort(["id", "(v % 2)"])
+ )
+
+ expected1 = (
+ df.withColumn("v1", df.v + 1)
+ .withColumn("v2", df.v + 2)
+ .groupby(df.id, df.v % 2)
+ .agg(
+ sf.sum(sf.col("v")),
+ sf.sum(sf.col("v1") + 3),
+ sf.sum(sf.col("v2")) + 5,
+ plus_one(sf.sum(sf.col("v1"))),
+ sf.sum(plus_one(sf.col("v2"))),
+ )
+ .sort(["id", "(v % 2)"])
+ .collect()
+ )
+
+ # Test complex expressions with sql expression, scalar pandas UDF and
+ # group aggregate pandas UDF
+ result2 = (
+ df.withColumn("v1", plus_one(df.v))
+ .withColumn("v2", df.v + 2)
+ .groupby(df.id, df.v % 2)
+ .agg(
+ sum_udf(sf.col("v")),
+ sum_udf(sf.col("v1") + 3),
+ sum_udf(sf.col("v2")) + 5,
+ plus_two(sum_udf(sf.col("v1"))),
+ sum_udf(plus_two(sf.col("v2"))),
+ )
+ .sort(["id", "(v % 2)"])
+ )
+
+ expected2 = (
+ df.withColumn("v1", df.v + 1)
+ .withColumn("v2", df.v + 2)
+ .groupby(df.id, df.v % 2)
+ .agg(
+ sf.sum(sf.col("v")),
+ sf.sum(sf.col("v1") + 3),
+ sf.sum(sf.col("v2")) + 5,
+ plus_two(sf.sum(sf.col("v1"))),
+ sf.sum(plus_two(sf.col("v2"))),
+ )
+ .sort(["id", "(v % 2)"])
+ .collect()
+ )
+
+ # Test sequential groupby aggregate
+ result3 = (
+ df.groupby("id")
+ .agg(sum_udf(df.v).alias("v"))
+ .groupby("id")
+ .agg(sum_udf(sf.col("v")))
+ .sort("id")
+ )
+
+ expected3 = (
+ df.groupby("id")
+ .agg(sf.sum(df.v).alias("v"))
+ .groupby("id")
+ .agg(sf.sum(sf.col("v")))
+ .sort("id")
+ .collect()
+ )
+
+ self.assertEqual(expected1, result1.collect())
+ self.assertEqual(expected2, result2.collect())
+ self.assertEqual(expected3, result3.collect())
+
+ def test_retain_group_columns(self):
+ with self.sql_conf({"spark.sql.retainGroupColumns": False}):
+ df = self.data
+ sum_udf = self.arrow_agg_sum_udf
+
+ result1 = df.groupby(df.id).agg(sum_udf(df.v))
+ expected1 = df.groupby(df.id).agg(sf.sum(df.v)).collect()
+ self.assertEqual(expected1, result1.collect())
+
+ def test_array_type(self):
+ df = self.data
+
+ array_udf = arrow_udf(lambda x: [1.0, 2.0], "array<double>", ArrowUDFType.GROUPED_AGG)
+ result1 = df.groupby("id").agg(array_udf(df["v"]).alias("v2"))
+ self.assertEqual(result1.first()["v2"], [1.0, 2.0])
+
+ def test_invalid_args(self):
+ with self.quiet():
+ self.check_invalid_args()
+
+ def check_invalid_args(self):
+ df = self.data
+ plus_one = self.python_plus_one
+ mean_udf = self.arrow_agg_mean_udf
+ with self.assertRaisesRegex(AnalysisException, r"\[MISSING_AGGREGATION\]"):
+ df.groupby(df.id).agg(plus_one(df.v)).collect()
+ with self.assertRaisesRegex(
+ AnalysisException, "aggregate function.*argument.*aggregate function"
+ ):
+ df.groupby(df.id).agg(mean_udf(mean_udf(df.v))).collect()
+ with self.assertRaisesRegex(
+ AnalysisException,
+ "The group aggregate pandas UDF `avg` cannot be invoked together with as other, "
+ "non-pandas aggregate functions.",
+ ):
+ df.groupby(df.id).agg(mean_udf(df.v), sf.mean(df.v)).collect()
+
+ def test_register_vectorized_udf_basic(self):
+ import pyarrow as pa
+
+ sum_arrow_udf = arrow_udf(
+ lambda v: pa.compute.sum(v).cast(pa.int32()),
+ "integer",
+ PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF,
+ )
+
+ self.assertEqual(sum_arrow_udf.evalType, PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF)
+ group_agg_pandas_udf = self.spark.udf.register("sum_arrow_udf", sum_arrow_udf)
+ self.assertEqual(group_agg_pandas_udf.evalType, PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF)
+ q = "SELECT sum_arrow_udf(v1) FROM VALUES (3, 0), (2, 0), (1, 1) tbl(v1, v2) GROUP BY v2"
+ actual = sorted(map(lambda r: r[0], self.spark.sql(q).collect()))
+ expected = [1, 5]
+ self.assertEqual(actual, expected)
+
+ def test_grouped_with_empty_partition(self):
+ import pyarrow as pa
+
+ data = [Row(id=1, x=2), Row(id=1, x=3), Row(id=2, x=4)]
+ expected = [Row(id=1, sum=5), Row(id=2, sum=4)]
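+ # Use more partitions than rows so at least one partition is guaranteed to be empty.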
+ num_parts = len(data) + 1
+ df = self.spark.createDataFrame(data).repartition(num_parts)
+
+ f = arrow_udf(lambda x: pa.compute.sum(x).cast(pa.int32()), "int", ArrowUDFType.GROUPED_AGG)
+
+ result = df.groupBy("id").agg(f(df["x"]).alias("sum")).sort("id")
+ self.assertEqual(result.collect(), expected)
+
+ def test_grouped_without_group_by_clause(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def max_udf(v):
+ return float(pa.compute.max(v).as_py())
+
+ df = self.spark.range(0, 100)
+ self.spark.udf.register("max_udf", max_udf)
+
+ with self.tempView("table"):
+ df.createTempView("table")
+
+ agg1 = df.agg(max_udf(df["id"]))
+ agg2 = self.spark.sql("select max_udf(id) from table")
+ self.assertEqual(agg1.collect(), agg2.collect())
+
+ def test_no_predicate_pushdown_through(self):
+ import pyarrow as pa
+
+ @arrow_udf("float", ArrowUDFType.GROUPED_AGG)
+ def mean(x):
+ return pa.compute.mean(x).cast(pa.float32())
+
+ df = self.spark.createDataFrame([Row(id=1, foo=42), Row(id=2, foo=1), Row(id=2, foo=2)])
+
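+ # The filter on the aggregated column must be applied after the Arrow aggregate UDF, so
+ # only the id=1 group (mean 42.0) survives; the id=2 group has mean 1.5 and is dropped.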
+ agg = df.groupBy("id").agg(mean("foo").alias("mean"))
+ filtered = agg.filter(agg["mean"] > 40.0)
+
+ self.assertEqual(filtered.collect()[0]["mean"], 42.0)
+
+ def test_named_arguments(self):
+ df = self.data
+ weighted_mean = self.arrow_agg_weighted_mean_udf
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("weighted_mean", weighted_mean)
+
+ for i, aggregated in enumerate(
+ [
+ df.groupby("id").agg(weighted_mean(df.v, w=df.w).alias("wm")),
+ df.groupby("id").agg(weighted_mean(v=df.v, w=df.w).alias("wm")),
+ df.groupby("id").agg(weighted_mean(w=df.w, v=df.v).alias("wm")),
+ self.spark.sql("SELECT id, weighted_mean(v, w => w) as wm FROM v GROUP BY id"),
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, w => w) as wm FROM v GROUP BY id"
+ ),
+ self.spark.sql(
+ "SELECT id, weighted_mean(w => w, v => v) as wm FROM v GROUP BY id"
+ ),
+ ]
+ ):
+ with self.subTest(query_no=i):
+ self.assertEqual(
+ aggregated.collect(),
+ df.groupby("id").agg(sf.mean(df.v).alias("wm")).collect(),
+ )
+
+ def test_named_arguments_negative(self):
+ df = self.data
+ weighted_mean = self.arrow_agg_weighted_mean_udf
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("weighted_mean", weighted_mean)
+
+ with self.assertRaisesRegex(
+ AnalysisException,
+ "DUPLICATE_ROUTINE_PARAMETER_ASSIGNMENT.DOUBLE_NAMED_ARGUMENT_REFERENCE",
+ ):
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, v => w) as wm FROM v GROUP BY id"
+ ).show()
+
+ with self.assertRaisesRegex(AnalysisException, "UNEXPECTED_POSITIONAL_ARGUMENT"):
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, w) as wm FROM v GROUP BY id"
+ ).show()
+
+ with self.assertRaisesRegex(
+ PythonException, r"weighted_mean\(\) got an unexpected keyword argument 'x'"
+ ):
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, x => w) as wm FROM v GROUP BY id"
+ ).show()
+
+ with self.assertRaisesRegex(
+ PythonException, r"weighted_mean\(\) got multiple values for argument 'v'"
+ ):
+ self.spark.sql(
+ "SELECT id, weighted_mean(v, v => w) as wm FROM v GROUP BY id"
+ ).show()
+
+ def test_kwargs(self):
+ df = self.data
+
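+ # A **kwargs-only UDF must be invoked with named arguments (v=..., w=... in Python,
+ # or v => ..., w => ... in SQL).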
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def weighted_mean(**kwargs):
+ import numpy as np
+
+ return np.average(kwargs["v"], weights=kwargs["w"])
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("weighted_mean", weighted_mean)
+
+ for i, aggregated in enumerate(
+ [
+ df.groupby("id").agg(weighted_mean(v=df.v, w=df.w).alias("wm")),
+ df.groupby("id").agg(weighted_mean(w=df.w, v=df.v).alias("wm")),
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, w => w) as wm FROM v GROUP BY id"
+ ),
+ self.spark.sql(
+ "SELECT id, weighted_mean(w => w, v => v) as wm FROM v GROUP BY id"
+ ),
+ ]
+ ):
+ with self.subTest(query_no=i):
+ self.assertEqual(
+ aggregated.collect(),
+ df.groupby("id").agg(sf.mean(df.v).alias("wm")).collect(),
+ )
+
+ # negative
+ with self.assertRaisesRegex(
+ AnalysisException,
+ "DUPLICATE_ROUTINE_PARAMETER_ASSIGNMENT.DOUBLE_NAMED_ARGUMENT_REFERENCE",
+ ):
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, v => w) as wm FROM v GROUP BY id"
+ ).show()
+
+ with self.assertRaisesRegex(AnalysisException, "UNEXPECTED_POSITIONAL_ARGUMENT"):
+ self.spark.sql(
+ "SELECT id, weighted_mean(v => v, w) as wm FROM v GROUP BY id"
+ ).show()
+
+ def test_named_arguments_and_defaults(self):
+ import pyarrow as pa
+
+ df = self.data
+
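+ # "w" defaults to None: when it is omitted the UDF adds a constant bias of 100,
+ # otherwise it adds sum(w).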
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def biased_sum(v, w=None):
+ return pa.compute.sum(v).as_py() + (pa.compute.sum(w).as_py() if w is not None else 100)
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("biased_sum", biased_sum)
+
+ # without "w"
+ for i, aggregated in enumerate(
+ [
+ df.groupby("id").agg(biased_sum(df.v).alias("s")),
+ df.groupby("id").agg(biased_sum(v=df.v).alias("s")),
+ self.spark.sql("SELECT id, biased_sum(v) as s FROM v GROUP BY id"),
+ self.spark.sql("SELECT id, biased_sum(v => v) as s FROM v GROUP BY id"),
+ ]
+ ):
+ with self.subTest(with_w=False, query_no=i):
+ self.assertEqual(
+ aggregated.collect(),
+ df.groupby("id").agg((sf.sum(df.v) + sf.lit(100)).alias("s")).collect(),
+ )
+
+ # with "w"
+ for i, aggregated in enumerate(
+ [
+ df.groupby("id").agg(biased_sum(df.v, w=df.w).alias("s")),
+ df.groupby("id").agg(biased_sum(v=df.v, w=df.w).alias("s")),
+ df.groupby("id").agg(biased_sum(w=df.w, v=df.v).alias("s")),
+ self.spark.sql("SELECT id, biased_sum(v, w => w) as s FROM v GROUP BY id"),
+ self.spark.sql("SELECT id, biased_sum(v => v, w => w) as s FROM v GROUP BY id"),
+ self.spark.sql("SELECT id, biased_sum(w => w, v => v) as s FROM v GROUP BY id"),
+ ]
+ ):
+ with self.subTest(with_w=True, query_no=i):
+ self.assertEqual(
+ aggregated.collect(),
+ df.groupby("id").agg((sf.sum(df.v) + sf.sum(df.w)).alias("s")).collect(),
+ )
+
+ def test_complex_agg_collect_set(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (1, 2), (2, 3), (2, 5), (2, 1)], ("id", "v"))
+
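+ # The grouped-agg UDF receives the whole column as a pa.Array and returns a single list
+ # scalar of the sorted distinct values, mirroring sort_array(collect_set(...)).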
+ @arrow_udf("array<int>")
+ def arrow_collect_set(v: pa.Array) -> pa.Scalar:
+ assert isinstance(v, pa.Array), str(type(v))
+ s = sorted([x.as_py() for x in pa.compute.unique(v)])
+ t = pa.list_(pa.int32())
+ return pa.scalar(value=s, type=t)
+
+ result1 = df.select(
+ arrow_collect_set(df["id"]).alias("ids"),
+ arrow_collect_set(df["v"]).alias("vs"),
+ )
+
+ expected1 = df.select(
+ sf.sort_array(sf.collect_set(df["id"])).alias("ids"),
+ sf.sort_array(sf.collect_set(df["v"])).alias("vs"),
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_complex_agg_collect_list(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (1, 2), (2, 3), (2, 5), (2, 1)], ("id", "v"))
+
+ @arrow_udf("array<int>")
+ def arrow_collect_list(v: pa.Array) -> pa.Scalar:
+ assert isinstance(v, pa.Array), str(type(v))
+ s = sorted([x.as_py() for x in v])
+ t = pa.list_(pa.int32())
+ return pa.scalar(value=s, type=t)
+
+ result1 = df.select(
+ arrow_collect_list(df["id"]).alias("ids"),
+ arrow_collect_list(df["v"]).alias("vs"),
+ )
+
+ expected1 = df.select(
+ sf.sort_array(sf.collect_list(df["id"])).alias("ids"),
+ sf.sort_array(sf.collect_list(df["v"])).alias("vs"),
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_complex_agg_collect_as_map(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (2, 2), (3, 5)], ("id", "v"))
+
+ @arrow_udf("map<int, int>")
+ def arrow_collect_as_map(id: pa.Array, v: pa.Array) -> pa.Scalar:
+ assert isinstance(id, pa.Array), str(type(id))
+ assert isinstance(v, pa.Array), str(type(v))
+ d = {i: j for i, j in zip(id.to_pylist(), v.to_pylist())}
+ t = pa.map_(pa.int32(), pa.int32())
+ return pa.scalar(value=d, type=t)
+
+ result1 = df.select(
+ arrow_collect_as_map("id", "v").alias("map"),
+ )
+
+ expected1 = df.select(
+ sf.map_from_arrays(sf.collect_list("id"), sf.collect_list("v")).alias("map"),
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_complex_agg_min_max_struct(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (2, 2), (3, 5)], ("id", "v"))
+
+ @arrow_udf("struct<m1: int, m2: int>")
+ def arrow_collect_min_max(id: pa.Array, v: pa.Array) -> pa.Scalar:
+ assert isinstance(id, pa.Array), str(type(id))
+ assert isinstance(v, pa.Array), str(type(v))
+ m1 = pa.compute.min(id)
+ m2 = pa.compute.max(v)
+ t = pa.struct([pa.field("m1", pa.int32()), pa.field("m2", pa.int32())])
+ return pa.scalar(value={"m1": m1.as_py(), "m2": m2.as_py()}, type=t)
+
+ result1 = df.select(
+ arrow_collect_min_max("id", "v").alias("struct"),
+ )
+
+ expected1 = df.select(
+ sf.struct(sf.min("id").alias("m1"), sf.max("v").alias("m2")).alias("struct"),
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_time_min(self):
+ import pyarrow as pa
+
+ df = self.spark.sql(
+ """
+ SELECT * FROM VALUES
+ (1, TIME '12:34:56'),
+ (1, TIME '1:2:3'),
+ (2, TIME '0:58:59'),
+ (2, TIME '10:58:59'),
+ (2, TIME '10:00:03')
+ AS tab(i, t)
+ """
+ )
+
+ @arrow_udf("time", ArrowUDFType.GROUPED_AGG)
+ def agg_min_time(v):
+ assert isinstance(v, pa.Array)
+ assert isinstance(v, pa.Time64Array)
+ return pa.compute.min(v)
+
+ expected1 = df.select(sf.min("t").alias("res"))
+ result1 = df.select(agg_min_time("t").alias("res"))
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ expected2 = df.groupby("i").agg(sf.min("t").alias("res")).sort("i")
+ result2 = df.groupby("i").agg(agg_min_time("t").alias("res")).sort("i")
+ self.assertEqual(expected2.collect(), result2.collect())
+
+ def test_return_type_coercion(self):
+ import pyarrow as pa
+
+ df = self.spark.range(10)
+
+ @arrow_udf("long", ArrowUDFType.GROUPED_AGG)
+ def agg_long(id: pa.Array) -> int:
+ assert isinstance(id, pa.Array), str(type(id))
+ return pa.scalar(value=len(id), type=pa.int64())
+
+ result1 = df.select(agg_long("id").alias("res"))
+ self.assertEqual(1, len(result1.collect()))
+
+ # long -> int coercion
+ @arrow_udf("int", ArrowUDFType.GROUPED_AGG)
+ def agg_int1(id: pa.Array) -> int:
+ assert isinstance(id, pa.Array), str(type(id))
+ return pa.scalar(value=len(id), type=pa.int64())
+
+ result2 = df.select(agg_int1("id").alias("res"))
+ self.assertEqual(1, len(result2.collect()))
+
+ # long -> int coercion, overflow
+ @arrow_udf("int", ArrowUDFType.GROUPED_AGG)
+ def agg_int2(id: pa.Array) -> int:
+ assert isinstance(id, pa.Array), str(type(id))
+ return pa.scalar(value=len(id) + 2147483647, type=pa.int64())
+
+ result3 = df.select(agg_int2("id").alias("res"))
+ with self.assertRaises(Exception):
+ # pyarrow.lib.ArrowInvalid:
+ # Integer value 2147483657 not in range: -2147483648 to 2147483647
+ result3.collect()
+
+ def test_unsupported_return_types(self):
+ import pyarrow as pa
+
+ with self.quiet():
+ with self.assertRaisesRegex(
+ NotImplementedError,
+ "Invalid return type with grouped aggregate "
+ "Arrow UDFs.*ArrayType.*YearMonthIntervalType",
+ ):
+ arrow_udf(
+ lambda x: x,
+ ArrayType(ArrayType(YearMonthIntervalType())),
+ ArrowUDFType.GROUPED_AGG,
+ )
+
+ with self.assertRaisesRegex(
+ NotImplementedError,
+ "Invalid return type with grouped aggregate "
+ "Arrow UDFs.*ArrayType.*YearMonthIntervalType",
+ ):
+
+ @arrow_udf(ArrayType(ArrayType(YearMonthIntervalType())), ArrowUDFType.GROUPED_AGG)
+ def func_a(a: pa.Array) -> pa.Scalar:
+ return pa.compute.max(a)
+
+
+class GroupedAggArrowUDFTests(GroupedAggArrowUDFTestsMixin, ReusedSQLTestCase):
+ pass
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.arrow.test_arrow_udf_grouped_agg import * # noqa: F401
+
+ try:
+ import xmlrunner
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_udf_scalar.py b/python/pyspark/sql/tests/arrow/test_arrow_udf_scalar.py
index 052956db6e6e2..d6e010d8d2a98 100644
--- a/python/pyspark/sql/tests/arrow/test_arrow_udf_scalar.py
+++ b/python/pyspark/sql/tests/arrow/test_arrow_udf_scalar.py
@@ -19,14 +19,13 @@
import random
import time
import unittest
-from datetime import date, datetime, timezone
+import datetime
from decimal import Decimal
from typing import Iterator, Tuple
from pyspark.util import PythonEvalType
-# TODO: import arrow_udf from public API
-from pyspark.sql.pandas.functions import arrow_udf, ArrowUDFType
+from pyspark.sql.functions import arrow_udf, ArrowUDFType
from pyspark.sql import functions as F
from pyspark.sql.types import (
IntegerType,
@@ -44,6 +43,7 @@
Row,
MapType,
BinaryType,
+ YearMonthIntervalType,
)
from pyspark.errors import AnalysisException, PythonException
from pyspark.testing.sqlutils import (
@@ -98,7 +98,7 @@ def test_arrow_udf_output_nested_arrays(self):
df = self.spark.createDataFrame([("hi boo",), ("bye boo",)], ["vals"])
tokenize = arrow_udf(
- lambda s: pa.array([pa.compute.ascii_split_whitespace(s).to_pylist()]),
+ lambda s: pa.array([[v] for v in pa.compute.ascii_split_whitespace(s).to_pylist()]),
ArrayType(ArrayType(StringType())),
)
@@ -305,16 +305,17 @@ def test_arrow_udf_output_dates(self):
def build_date(y, m, d):
assert all(isinstance(x, pa.Array) for x in [y, m, d])
dates = [
- date(int(y[i].as_py()), int(m[i].as_py()), int(d[i].as_py())) for i in range(len(y))
+ datetime.date(int(y[i].as_py()), int(m[i].as_py()), int(d[i].as_py()))
+ for i in range(len(y))
]
return pa.array(dates, pa.date32())
result = df.select(build_date("y", "m", "d").alias("date"))
self.assertEqual(
[
- Row(date=date(2022, 1, 5)),
- Row(date=date(2023, 2, 6)),
- Row(date=date(2024, 3, 7)),
+ Row(date=datetime.date(2022, 1, 5)),
+ Row(date=datetime.date(2023, 2, 6)),
+ Row(date=datetime.date(2024, 3, 7)),
],
result.collect(),
)
@@ -361,14 +362,14 @@ def test_arrow_udf_output_timestamps_ltz(self):
def build_ts(y, m, d, h, mi, s):
assert all(isinstance(x, pa.Array) for x in [y, m, d, h, mi, s])
dates = [
- datetime(
+ datetime.datetime(
int(y[i].as_py()),
int(m[i].as_py()),
int(d[i].as_py()),
int(h[i].as_py()),
int(mi[i].as_py()),
int(s[i].as_py()),
- tzinfo=timezone.utc,
+ tzinfo=datetime.timezone.utc,
)
for i in range(len(y))
]
@@ -377,9 +378,9 @@ def build_ts(y, m, d, h, mi, s):
result = df.select(build_ts("y", "m", "d", "h", "mi", "s").alias("ts"))
self.assertEqual(
[
- Row(ts=datetime(2022, 1, 5, 7, 0, 1)),
- Row(ts=datetime(2023, 2, 6, 8, 1, 2)),
- Row(ts=datetime(2024, 3, 7, 9, 2, 3)),
+ Row(ts=datetime.datetime(2022, 1, 5, 7, 0, 1)),
+ Row(ts=datetime.datetime(2023, 2, 6, 8, 1, 2)),
+ Row(ts=datetime.datetime(2024, 3, 7, 9, 2, 3)),
],
result.collect(),
)
@@ -401,7 +402,7 @@ def test_arrow_udf_output_timestamps_ntz(self):
def build_ts(y, m, d, h, mi, s):
assert all(isinstance(x, pa.Array) for x in [y, m, d, h, mi, s])
dates = [
- datetime(
+ datetime.datetime(
int(y[i].as_py()),
int(m[i].as_py()),
int(d[i].as_py()),
@@ -416,13 +417,137 @@ def build_ts(y, m, d, h, mi, s):
result = df.select(build_ts("y", "m", "d", "h", "mi", "s").alias("ts"))
self.assertEqual(
[
- Row(ts=datetime(2022, 1, 5, 15, 0, 1)),
- Row(ts=datetime(2023, 2, 6, 16, 1, 2)),
- Row(ts=datetime(2024, 3, 7, 17, 2, 3)),
+ Row(ts=datetime.datetime(2022, 1, 5, 15, 0, 1)),
+ Row(ts=datetime.datetime(2023, 2, 6, 16, 1, 2)),
+ Row(ts=datetime.datetime(2024, 3, 7, 17, 2, 3)),
+ ],
+ result.collect(),
+ )
+
+ def test_arrow_udf_input_times(self):
+ import pyarrow as pa
+
+ df = self.spark.sql(
+ """
+ SELECT * FROM VALUES
+ (1, TIME '12:34:56'),
+ (2, TIME '1:2:3'),
+ (3, TIME '0:58:59')
+ AS tab(i, ts)
+ """
+ )
+
+ @arrow_udf("int")
+ def extract_second(v):
+ assert isinstance(v, pa.Array)
+ assert isinstance(v, pa.Time64Array), type(v)
+ return pa.array([t.as_py().second for t in v], pa.int32())
+
+ result = df.select(extract_second("ts").alias("sec"))
+ self.assertEqual(
+ [
+ Row(sec=56),
+ Row(sec=3),
+ Row(sec=59),
+ ],
+ result.collect(),
+ )
+
+ def test_arrow_udf_output_times(self):
+ import pyarrow as pa
+
+ df = self.spark.sql(
+ """
+ SELECT * FROM VALUES
+ (12, 34, 56),
+ (1, 2, 3),
+ (0, 58, 59)
+ AS tab(h, mi, s)
+ """
+ )
+
+ @arrow_udf("time")
+ def build_time(h, mi, s):
+ assert all(isinstance(x, pa.Array) for x in [h, mi, s])
+ dates = [
+ datetime.time(
+ int(h[i].as_py()),
+ int(mi[i].as_py()),
+ int(s[i].as_py()),
+ )
+ for i in range(len(h))
+ ]
+ return pa.array(dates, pa.time64("ns"))
+
+ result = df.select(build_time("h", "mi", "s").alias("t"))
+ self.assertEqual(
+ [
+ Row(t=datetime.time(12, 34, 56)),
+ Row(t=datetime.time(1, 2, 3)),
+ Row(t=datetime.time(0, 58, 59)),
],
result.collect(),
)
+
+ def test_arrow_udf_input_variant(self):
+ import pyarrow as pa
+
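+ # A variant column reaches the Arrow UDF as a struct array with binary "metadata" and
+ # "value" fields; each parsed single-digit id yields a 2-byte variant value.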
+ @arrow_udf("int")
+ def scalar_f(v: pa.Array) -> pa.Array:
+ assert isinstance(v, pa.Array)
+ assert isinstance(v, pa.StructArray)
+ assert isinstance(v.field("metadata"), pa.BinaryArray)
+ assert isinstance(v.field("value"), pa.BinaryArray)
+ return pa.compute.binary_length(v.field("value"))
+
+ @arrow_udf("int")
+ def iter_f(it: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ for v in it:
+ assert isinstance(v, pa.Array)
+ assert isinstance(v, pa.StructArray)
+ assert isinstance(v.field("metadata"), pa.BinaryArray)
+ assert isinstance(v.field("value"), pa.BinaryArray)
+ yield pa.compute.binary_length(v.field("value"))
+
+ df = self.spark.range(0, 10).selectExpr("parse_json(cast(id as string)) v")
+ expected = [Row(l=2) for i in range(10)]
+
+ for f in [scalar_f, iter_f]:
+ result = df.select(f("v").alias("l")).collect()
+ self.assertEqual(result, expected)
+
+ def test_arrow_udf_output_variant(self):
+ # referring to test_udf_with_variant_output in test_pandas_udf_scalar
+ import pyarrow as pa
+
+ # referring to to_arrow_type in pyspark.sql.pandas.types
+ fields = [
+ pa.field("value", pa.binary(), nullable=False),
+ pa.field("metadata", pa.binary(), nullable=False, metadata={b"variant": b"true"}),
+ ]
+
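+ # The value bytes encode a variant int8 (header byte 12 followed by the id); the metadata
+ # bytes are a minimal version-1 header with an empty dictionary.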
+ @arrow_udf("variant")
+ def scalar_f(v: pa.Array) -> pa.Array:
+ assert isinstance(v, pa.Array)
+ v = pa.array([bytes([12, i.as_py()]) for i in v], pa.binary())
+ m = pa.array([bytes([1, 0, 0]) for i in v], pa.binary())
+ return pa.StructArray.from_arrays([v, m], fields=fields)
+
+ @arrow_udf("variant")
+ def iter_f(it: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ for v in it:
+ assert isinstance(v, pa.Array)
+ v = pa.array([bytes([12, i.as_py()]) for i in v])
+ m = pa.array([bytes([1, 0, 0]) for i in v])
+ yield pa.StructArray.from_arrays([v, m], fields=fields)
+
+ df = self.spark.range(0, 10)
+ expected = [Row(l=i) for i in range(10)]
+
+ for f in [scalar_f, iter_f]:
+ result = df.select(f("id").cast("int").alias("l")).collect()
+ self.assertEqual(result, expected)
+
def test_arrow_udf_null_boolean(self):
data = [(True,), (True,), (None,), (False,)]
schema = StructType().add("bool", BooleanType())
@@ -536,7 +661,9 @@ def test_arrow_udf_datatype_string(self):
F.col("id").alias("long"),
F.col("id").cast("float").alias("float"),
F.col("id").cast("double").alias("double"),
- # F.col("id").cast("decimal").alias("decimal"),
+ F.col("id").cast("decimal").alias("decimal1"),
+ F.col("id").cast("decimal(10, 0)").alias("decimal2"),
+ F.col("id").cast("decimal(38, 18)").alias("decimal3"),
F.col("id").cast("boolean").alias("bool"),
)
@@ -549,7 +676,9 @@ def f(x):
long_f = arrow_udf(f, "long", udf_type)
float_f = arrow_udf(f, "float", udf_type)
double_f = arrow_udf(f, "double", udf_type)
- # decimal_f = arrow_udf(f, "decimal(38, 18)", udf_type)
+ decimal1_f = arrow_udf(f, "decimal", udf_type)
+ decimal2_f = arrow_udf(f, "decimal(10, 0)", udf_type)
+ decimal3_f = arrow_udf(f, "decimal(38, 18)", udf_type)
bool_f = arrow_udf(f, "boolean", udf_type)
res = df.select(
str_f(F.col("str")),
@@ -557,7 +686,9 @@ def f(x):
long_f(F.col("long")),
float_f(F.col("float")),
double_f(F.col("double")),
- # decimal_f("decimal"),
+ decimal1_f("decimal1"),
+ decimal2_f("decimal2"),
+ decimal3_f("decimal3"),
bool_f(F.col("bool")),
)
self.assertEqual(df.collect(), res.collect())
@@ -588,6 +719,22 @@ def test_udf_register_arrow_udf_basic(self):
self.assertEqual(expected.collect(), res1.collect())
self.assertEqual(expected.collect(), res2.collect())
+ @arrow_udf(LongType())
+ def scalar_iter_add(it: Iterator[Tuple[pa.Array, pa.Array]]) -> Iterator[pa.Array]:
+ for a, b in it:
+ yield pa.compute.add(a, b)
+
+ self.spark.sql("DROP TEMPORARY FUNCTION IF EXISTS add1")
+ new_add = self.spark.udf.register("add1", scalar_iter_add)
+
+ res3 = df.select(new_add(F.col("a"), F.col("b")))
+ res4 = self.spark.sql(
+ "SELECT add1(t.a, t.b) FROM (SELECT id as a, id as b FROM range(10)) t"
+ )
+ expected = df.select(F.expr("a + b"))
+ self.assertEqual(expected.collect(), res3.collect())
+ self.assertEqual(expected.collect(), res4.collect())
+
def test_catalog_register_arrow_udf_basic(self):
import pyarrow as pa
@@ -614,6 +761,22 @@ def test_catalog_register_arrow_udf_basic(self):
self.assertEqual(expected.collect(), res1.collect())
self.assertEqual(expected.collect(), res2.collect())
+ @arrow_udf(LongType())
+ def scalar_iter_add(it: Iterator[Tuple[pa.Array, pa.Array]]) -> Iterator[pa.Array]:
+ for a, b in it:
+ yield pa.compute.add(a, b)
+
+ self.spark.sql("DROP TEMPORARY FUNCTION IF EXISTS add1")
+ new_add = self.spark.catalog.registerFunction("add1", scalar_iter_add)
+
+ res3 = df.select(new_add(F.col("a"), F.col("b")))
+ res4 = self.spark.sql(
+ "SELECT add1(t.a, t.b) FROM (SELECT id as a, id as b FROM range(10)) t"
+ )
+ expected = df.select(F.expr("a + b"))
+ self.assertEqual(expected.collect(), res3.collect())
+ self.assertEqual(expected.collect(), res4.collect())
+
def test_udf_register_nondeterministic_arrow_udf(self):
import pyarrow as pa
@@ -963,6 +1126,48 @@ def multiple(it: Iterator[Tuple[pa.Array, pa.Array, pa.Array]]) -> Iterator[pa.A
result = df.select(multiple("a", "b", "c").alias("res"))
self.assertEqual(expected, result.collect())
+
+ def test_return_type_coercion(self):
+ import pyarrow as pa
+
+ df = self.spark.range(10)
+
+ scalar_long = arrow_udf(lambda x: pa.compute.add(x, 1), LongType())
+ result1 = df.select(scalar_long("id").alias("res"))
+ self.assertEqual(10, len(result1.collect()))
+
+ # long -> int coercion
+ scalar_int1 = arrow_udf(lambda x: pa.compute.add(x, 1), IntegerType())
+ result2 = df.select(scalar_int1("id").alias("res"))
+ self.assertEqual(10, len(result2.collect()))
+
+ # long -> int coercion, overflow
+ scalar_int2 = arrow_udf(lambda x: pa.compute.add(x, 2147483647), IntegerType())
+ result3 = df.select(scalar_int2("id").alias("res"))
+ with self.assertRaises(Exception):
+ # pyarrow.lib.ArrowInvalid:
+ # Integer value 2147483652 not in range: -2147483648 to 2147483647
+ result3.collect()
+
+ def test_unsupported_return_types(self):
+ import pyarrow as pa
+
+ with self.quiet():
+ for udf_type in [ArrowUDFType.SCALAR, ArrowUDFType.SCALAR_ITER]:
+ with self.assertRaisesRegex(
+ NotImplementedError,
+ "Invalid return type.*scalar Arrow UDF.*ArrayType.*YearMonthIntervalType",
+ ):
+ arrow_udf(lambda x: x, ArrayType(YearMonthIntervalType()), udf_type)
+
+ with self.assertRaisesRegex(
+ NotImplementedError,
+ "Invalid return type.*scalar Arrow UDF.*ArrayType.*YearMonthIntervalType",
+ ):
+
+ @arrow_udf(ArrayType(YearMonthIntervalType()))
+ def func_a(a: pa.Array) -> pa.Array:
+ return a
+
class ScalarArrowUDFTests(ScalarArrowUDFTestsMixin, ReusedSQLTestCase):
@classmethod
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_udf_typehints.py b/python/pyspark/sql/tests/arrow/test_arrow_udf_typehints.py
new file mode 100644
index 0000000000000..81d980cc37212
--- /dev/null
+++ b/python/pyspark/sql/tests/arrow/test_arrow_udf_typehints.py
@@ -0,0 +1,351 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+import unittest
+from inspect import signature
+from typing import Union, Iterator, Tuple, get_type_hints
+
+from pyspark.sql import functions as sf
+from pyspark.testing.utils import (
+ have_pandas,
+ pandas_requirement_message,
+ have_pyarrow,
+ pyarrow_requirement_message,
+ have_numpy,
+ numpy_requirement_message,
+)
+from pyspark.testing.sqlutils import ReusedSQLTestCase
+from pyspark.sql.pandas.typehints import infer_eval_type
+from pyspark.sql.pandas.functions import arrow_udf, ArrowUDFType
+from pyspark.sql import Row
+
+if have_pyarrow:
+ import pyarrow as pa
+
+
+@unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+class ArrowUDFTypeHintsTests(ReusedSQLTestCase):
+ def test_type_annotation_scalar(self):
+ def func(col: pa.Array) -> pa.Array:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: pa.Array, col1: pa.Array) -> pa.Array:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: pa.Array, *args: pa.Array) -> pa.Array:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: pa.Array, *args: pa.Array, **kwargs: pa.Array) -> pa.Array:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: pa.Array, *, col2: pa.Array) -> pa.Array:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ # Union[pa.Array, pa.Array] equals to pa.Array
+ def func(col: Union[pa.Array, pa.Array], *, col2: pa.Array) -> pa.Array:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def test_type_annotation_scalar_iter(self):
+ def func(iter: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR_ITER
+ )
+
+ def func(iter: Iterator[Tuple[pa.Array, ...]]) -> Iterator[pa.Array]:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR_ITER
+ )
+
+ def test_type_annotation_tuple_generics(self):
+ def func(iter: Iterator[tuple[pa.Array, pa.Array]]) -> Iterator[pa.Array]:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR_ITER
+ )
+
+ def func(iter: Iterator[tuple[pa.Array, ...]]) -> Iterator[pa.Array]:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR_ITER
+ )
+
+ # Union[pa.Array, pa.Array] equals to pa.Array
+ def func(iter: Iterator[tuple[Union[pa.Array, pa.Array], ...]]) -> Iterator[pa.Array]:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR_ITER
+ )
+
+ def test_type_annotation_group_agg(self):
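+ # A pa.Array input annotated with a non-Array (scalar-like) return type is inferred as GROUPED_AGG.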
+ def func(col: pa.Array) -> str:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.GROUPED_AGG
+ )
+
+ def func(col: pa.Array, col1: pa.Array) -> int:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.GROUPED_AGG
+ )
+
+ def func(col: pa.Array, *args: pa.Array) -> Row:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.GROUPED_AGG
+ )
+
+ def func(col: pa.Array, *args: pa.Array, **kwargs: pa.Array) -> str:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.GROUPED_AGG
+ )
+
+ def func(col: pa.Array, *, col2: pa.Array) -> float:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.GROUPED_AGG
+ )
+
+ # Union[pa.Array, pa.Array] equals to pa.Array
+ def func(col: Union[pa.Array, pa.Array], *, col2: pa.Array) -> float:
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.GROUPED_AGG
+ )
+
+ def test_type_annotation_negative(self):
+ def func(col: str) -> pa.Array:
+ pass
+
+ self.assertRaisesRegex(
+ NotImplementedError,
+ "Unsupported signature.*str",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def func(col: pa.Array, col1: int) -> pa.Array:
+ pass
+
+ self.assertRaisesRegex(
+ NotImplementedError,
+ "Unsupported signature.*int",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def func(col: Union[pa.Array, str], col1: int) -> pa.Array:
+ pass
+
+ self.assertRaisesRegex(
+ NotImplementedError,
+ "Unsupported signature.*str",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def func(col: pa.Array) -> Tuple[pa.Array]:
+ pass
+
+ self.assertRaisesRegex(
+ NotImplementedError,
+ "Unsupported signature.*Tuple",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def func(col, *args: pa.Array) -> pa.Array:
+ pass
+
+ self.assertRaisesRegex(
+ ValueError,
+ "should be specified.*Array",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def func(col: pa.Array, *args: pa.Array, **kwargs: pa.Array):
+ pass
+
+ self.assertRaisesRegex(
+ ValueError,
+ "should be specified.*Array",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def func(col: pa.Array, *, col2) -> pa.Array:
+ pass
+
+ self.assertRaisesRegex(
+ ValueError,
+ "should be specified.*Array",
+ infer_eval_type,
+ signature(func),
+ get_type_hints(func),
+ )
+
+ def test_scalar_udf_type_hint(self):
+ df = self.spark.range(10).selectExpr("id", "id as v")
+
+ def plus_one(v: pa.Array) -> pa.Array:
+ return pa.compute.add(v, 1)
+
+ plus_one = arrow_udf("long")(plus_one)
+ actual = df.select(plus_one(df.v).alias("plus_one"))
+ expected = df.selectExpr("(v + 1) as plus_one")
+ self.assertEqual(expected.collect(), actual.collect())
+
+ def test_scalar_iter_udf_type_hint(self):
+ df = self.spark.range(10).selectExpr("id", "id as v")
+
+ def plus_one(itr: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ for s in itr:
+ yield pa.compute.add(s, 1)
+
+ plus_one = arrow_udf("long")(plus_one)
+
+ actual = df.select(plus_one(df.v).alias("plus_one"))
+ expected = df.selectExpr("(v + 1) as plus_one")
+ self.assertEqual(expected.collect(), actual.collect())
+
+ @unittest.skipIf(not have_numpy, numpy_requirement_message)
+ def test_group_agg_udf_type_hint(self):
+ import numpy as np
+
+ df = self.spark.range(10).selectExpr("id", "id as v")
+
+ def weighted_mean(v: pa.Array, w: pa.Array) -> np.float64:
+ return np.average(v, weights=w)
+
+ weighted_mean = arrow_udf("double")(weighted_mean)
+
+ actual = df.groupby("id").agg(weighted_mean(df.v, sf.lit(1.0))).sort("id")
+ expected = df.groupby("id").agg(sf.mean(df.v).alias("weighted_mean(v, 1.0)")).sort("id")
+ self.assertEqual(expected.collect(), actual.collect())
+
+ def test_string_type_annotation(self):
+ def func(col: "pa.Array") -> "pa.Array":
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: "pa.Array", col1: "pa.Array") -> "pa.Array":
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: "pa.Array", *args: "pa.Array") -> "pa.Array":
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: "pa.Array", *args: "pa.Array", **kwargs: "pa.Array") -> "pa.Array":
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ def func(col: "pa.Array", *, col2: "pa.Array") -> "pa.Array":
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ # Union[pa.Array, pa.Array] equals to pa.Array
+ def func(col: Union["pa.Array", "pa.Array"], *, col2: "pa.Array") -> "pa.Array":
+ pass
+
+ self.assertEqual(
+ infer_eval_type(signature(func), get_type_hints(func)), ArrowUDFType.SCALAR
+ )
+
+ @unittest.skipIf(not have_pandas, pandas_requirement_message)
+ def test_negative_with_pandas_udf(self):
+ import pandas as pd
+
+ with self.assertRaisesRegex(
+ Exception,
+ "Unsupported signature:.*pandas.core.series.Series.",
+ ):
+
+ @arrow_udf("long")
+ def multiply_pandas(a: pd.Series, b: pd.Series) -> pd.Series:
+ return a * b
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.arrow.test_arrow_udf_typehints import * # noqa: F401
+
+ try:
+ import xmlrunner
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_udf_window.py b/python/pyspark/sql/tests/arrow/test_arrow_udf_window.py
new file mode 100644
index 0000000000000..fde9d72433757
--- /dev/null
+++ b/python/pyspark/sql/tests/arrow/test_arrow_udf_window.py
@@ -0,0 +1,735 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import unittest
+
+from pyspark.sql.functions import arrow_udf, ArrowUDFType
+from pyspark.util import PythonEvalType
+from pyspark.sql import functions as sf
+from pyspark.sql.window import Window
+from pyspark.errors import AnalysisException, PythonException, PySparkTypeError
+from pyspark.testing.sqlutils import (
+ ReusedSQLTestCase,
+ have_pyarrow,
+ pyarrow_requirement_message,
+)
+
+
+@unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+class WindowArrowUDFTestsMixin:
+ @property
+ def data(self):
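+ # 10 ids, each exploded into 10 double values (20 + id .. 29 + id), with a constant weight of 1.0.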
+ return (
+ self.spark.range(10)
+ .toDF("id")
+ .withColumn("vs", sf.array([sf.lit(i * 1.0) + sf.col("id") for i in range(20, 30)]))
+ .withColumn("v", sf.explode(sf.col("vs")))
+ .drop("vs")
+ .withColumn("w", sf.lit(1.0))
+ )
+
+ @property
+ def python_plus_one(self):
+ @sf.udf("double")
+ def plus_one(v):
+ assert isinstance(v, float)
+ return v + 1
+
+ return plus_one
+
+ @property
+ def arrow_scalar_time_two(self):
+ import pyarrow as pa
+
+ return arrow_udf(lambda v: pa.compute.multiply(v, 2), "double")
+
+ @property
+ def arrow_agg_count_udf(self):
+ @arrow_udf("long", ArrowUDFType.GROUPED_AGG)
+ def count(v):
+ return len(v)
+
+ return count
+
+ @property
+ def arrow_agg_mean_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def avg(v):
+ return pa.compute.mean(v)
+
+ return avg
+
+ @property
+ def arrow_agg_max_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def max(v):
+ return pa.compute.max(v)
+
+ return max
+
+ @property
+ def arrow_agg_min_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def min(v):
+ return pa.compute.min(v)
+
+ return min
+
+ @property
+ def arrow_agg_weighted_mean_udf(self):
+ import numpy as np
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def weighted_mean(v, w):
+ return np.average(v, weights=w)
+
+ return weighted_mean
+
+ @property
+ def unbounded_window(self):
+ return (
+ Window.partitionBy("id")
+ .rowsBetween(Window.unboundedPreceding, Window.unboundedFollowing)
+ .orderBy("v")
+ )
+
+ @property
+ def ordered_window(self):
+ return Window.partitionBy("id").orderBy("v")
+
+ @property
+ def unpartitioned_window(self):
+ return Window.partitionBy()
+
+ @property
+ def sliding_row_window(self):
+ return Window.partitionBy("id").orderBy("v").rowsBetween(-2, 1)
+
+ @property
+ def sliding_range_window(self):
+ return Window.partitionBy("id").orderBy("v").rangeBetween(-2, 4)
+
+ @property
+ def growing_row_window(self):
+ return Window.partitionBy("id").orderBy("v").rowsBetween(Window.unboundedPreceding, 3)
+
+ @property
+ def growing_range_window(self):
+ return Window.partitionBy("id").orderBy("v").rangeBetween(Window.unboundedPreceding, 4)
+
+ @property
+ def shrinking_row_window(self):
+ return Window.partitionBy("id").orderBy("v").rowsBetween(-2, Window.unboundedFollowing)
+
+ @property
+ def shrinking_range_window(self):
+ return Window.partitionBy("id").orderBy("v").rangeBetween(-3, Window.unboundedFollowing)
+
+ def test_simple(self):
+ df = self.data
+ w = self.unbounded_window
+
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("mean_v", mean_udf(df["v"]).over(w))
+ expected1 = df.withColumn("mean_v", sf.mean(df["v"]).over(w))
+
+ result2 = df.select(mean_udf(df["v"]).over(w))
+ expected2 = df.select(sf.mean(df["v"]).over(w))
+
+ self.assertEqual(expected1.collect(), result1.collect())
+ self.assertEqual(expected2.collect(), result2.collect())
+
+ def test_multiple_udfs(self):
+ df = self.data
+ w = self.unbounded_window
+
+ result1 = (
+ df.withColumn("mean_v", self.arrow_agg_mean_udf(df["v"]).over(w))
+ .withColumn("max_v", self.arrow_agg_max_udf(df["v"]).over(w))
+ .withColumn("min_w", self.arrow_agg_min_udf(df["w"]).over(w))
+ )
+
+ expected1 = (
+ df.withColumn("mean_v", sf.mean(df["v"]).over(w))
+ .withColumn("max_v", sf.max(df["v"]).over(w))
+ .withColumn("min_w", sf.min(df["w"]).over(w))
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_replace_existing(self):
+ df = self.data
+ w = self.unbounded_window
+
+ result1 = df.withColumn("v", self.arrow_agg_mean_udf(df["v"]).over(w))
+ expected1 = df.withColumn("v", sf.mean(df["v"]).over(w))
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_mixed_sql(self):
+ df = self.data
+ w = self.unbounded_window
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("v", mean_udf(df["v"] * 2).over(w) + 1)
+ expected1 = df.withColumn("v", sf.mean(df["v"] * 2).over(w) + 1)
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_mixed_udf(self):
+ df = self.data
+ w = self.unbounded_window
+
+ plus_one = self.python_plus_one
+ time_two = self.arrow_scalar_time_two
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("v2", plus_one(mean_udf(plus_one(df["v"])).over(w)))
+ expected1 = df.withColumn("v2", plus_one(sf.mean(plus_one(df["v"])).over(w)))
+
+ result2 = df.withColumn("v2", time_two(mean_udf(time_two(df["v"])).over(w)))
+ expected2 = df.withColumn("v2", time_two(sf.mean(time_two(df["v"])).over(w)))
+
+ self.assertEqual(expected1.collect(), result1.collect())
+ self.assertEqual(expected2.collect(), result2.collect())
+
+ def test_without_partitionBy(self):
+ df = self.data
+ w = self.unpartitioned_window
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("v2", mean_udf(df["v"]).over(w))
+ expected1 = df.withColumn("v2", sf.mean(df["v"]).over(w))
+
+ result2 = df.select(mean_udf(df["v"]).over(w))
+ expected2 = df.select(sf.mean(df["v"]).over(w))
+
+ self.assertEqual(expected1.collect(), result1.collect())
+ self.assertEqual(expected2.collect(), result2.collect())
+
+ def test_mixed_sql_and_udf(self):
+ df = self.data
+ w = self.unbounded_window
+ ow = self.ordered_window
+ max_udf = self.arrow_agg_max_udf
+ min_udf = self.arrow_agg_min_udf
+
+ result1 = df.withColumn("v_diff", max_udf(df["v"]).over(w) - min_udf(df["v"]).over(w))
+ expected1 = df.withColumn("v_diff", sf.max(df["v"]).over(w) - sf.min(df["v"]).over(w))
+
+ # Test mixing sql window function and window udf in the same expression
+ result2 = df.withColumn("v_diff", max_udf(df["v"]).over(w) - sf.min(df["v"]).over(w))
+ expected2 = expected1
+
+ # Test chaining sql aggregate function and udf
+ result3 = (
+ df.withColumn("max_v", max_udf(df["v"]).over(w))
+ .withColumn("min_v", sf.min(df["v"]).over(w))
+ .withColumn("v_diff", sf.col("max_v") - sf.col("min_v"))
+ .drop("max_v", "min_v")
+ )
+ expected3 = expected1
+
+ # Test mixing sql window function and udf
+ result4 = df.withColumn("max_v", max_udf(df["v"]).over(w)).withColumn(
+ "rank", sf.rank().over(ow)
+ )
+ expected4 = df.withColumn("max_v", sf.max(df["v"]).over(w)).withColumn(
+ "rank", sf.rank().over(ow)
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+ self.assertEqual(expected2.collect(), result2.collect())
+ self.assertEqual(expected3.collect(), result3.collect())
+ self.assertEqual(expected4.collect(), result4.collect())
+
+ def test_array_type(self):
+ df = self.data
+ w = self.unbounded_window
+
+ array_udf = arrow_udf(lambda x: [1.0, 2.0], "array<double>", ArrowUDFType.GROUPED_AGG)
+ result1 = df.withColumn("v2", array_udf(df["v"]).over(w))
+ self.assertEqual(result1.first()["v2"], [1.0, 2.0])
+
+ def test_invalid_args(self):
+ with self.quiet():
+ self.check_invalid_args()
+
+ def check_invalid_args(self):
+ df = self.data
+ w = self.unbounded_window
+
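+ # A grouped-map Arrow UDF is not an aggregate function, so it cannot be used over a window.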
+ with self.assertRaises(PySparkTypeError):
+ foo_udf = arrow_udf(lambda x: x, "v double", PythonEvalType.SQL_GROUPED_MAP_ARROW_UDF)
+ df.withColumn("v2", foo_udf(df["v"]).over(w)).schema
+
+ def test_bounded_simple(self):
+ df = self.data
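+ # Sliding and shrinking frames exercise bounded-window evaluation, where the UDF sees only
+ # each row's frame slice.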
+ w1 = self.sliding_row_window
+ w2 = self.shrinking_range_window
+
+ plus_one = self.python_plus_one
+ count_udf = self.arrow_agg_count_udf
+ mean_udf = self.arrow_agg_mean_udf
+ max_udf = self.arrow_agg_max_udf
+ min_udf = self.arrow_agg_min_udf
+
+ result1 = (
+ df.withColumn("mean_v", mean_udf(plus_one(df["v"])).over(w1))
+ .withColumn("count_v", count_udf(df["v"]).over(w2))
+ .withColumn("max_v", max_udf(df["v"]).over(w2))
+ .withColumn("min_v", min_udf(df["v"]).over(w1))
+ )
+
+ expected1 = (
+ df.withColumn("mean_v", sf.mean(plus_one(df["v"])).over(w1))
+ .withColumn("count_v", sf.count(df["v"]).over(w2))
+ .withColumn("max_v", sf.max(df["v"]).over(w2))
+ .withColumn("min_v", sf.min(df["v"]).over(w1))
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_growing_window(self):
+ df = self.data
+ w1 = self.growing_row_window
+ w2 = self.growing_range_window
+
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("m1", mean_udf(df["v"]).over(w1)).withColumn(
+ "m2", mean_udf(df["v"]).over(w2)
+ )
+
+ expected1 = df.withColumn("m1", sf.mean(df["v"]).over(w1)).withColumn(
+ "m2", sf.mean(df["v"]).over(w2)
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_sliding_window(self):
+ df = self.data
+ w1 = self.sliding_row_window
+ w2 = self.sliding_range_window
+
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("m1", mean_udf(df["v"]).over(w1)).withColumn(
+ "m2", mean_udf(df["v"]).over(w2)
+ )
+
+ expected1 = df.withColumn("m1", sf.mean(df["v"]).over(w1)).withColumn(
+ "m2", sf.mean(df["v"]).over(w2)
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_shrinking_window(self):
+ df = self.data
+ w1 = self.shrinking_row_window
+ w2 = self.shrinking_range_window
+
+ mean_udf = self.arrow_agg_mean_udf
+
+ result1 = df.withColumn("m1", mean_udf(df["v"]).over(w1)).withColumn(
+ "m2", mean_udf(df["v"]).over(w2)
+ )
+
+ expected1 = df.withColumn("m1", sf.mean(df["v"]).over(w1)).withColumn(
+ "m2", sf.mean(df["v"]).over(w2)
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_bounded_mixed(self):
+ df = self.data
+ w1 = self.sliding_row_window
+ w2 = self.unbounded_window
+
+ mean_udf = self.arrow_agg_mean_udf
+ max_udf = self.arrow_agg_max_udf
+
+ result1 = (
+ df.withColumn("mean_v", mean_udf(df["v"]).over(w1))
+ .withColumn("max_v", max_udf(df["v"]).over(w2))
+ .withColumn("mean_unbounded_v", mean_udf(df["v"]).over(w1))
+ )
+
+ expected1 = (
+ df.withColumn("mean_v", sf.mean(df["v"]).over(w1))
+ .withColumn("max_v", sf.max(df["v"]).over(w2))
+ .withColumn("mean_unbounded_v", sf.mean(df["v"]).over(w1))
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_named_arguments(self):
+ df = self.data
+ weighted_mean = self.arrow_agg_weighted_mean_udf
+
+ for w, bound in [(self.sliding_row_window, True), (self.unbounded_window, False)]:
+ for i, windowed in enumerate(
+ [
+ df.withColumn("wm", weighted_mean(df.v, w=df.w).over(w)),
+ df.withColumn("wm", weighted_mean(v=df.v, w=df.w).over(w)),
+ df.withColumn("wm", weighted_mean(w=df.w, v=df.v).over(w)),
+ ]
+ ):
+ with self.subTest(bound=bound, query_no=i):
+ self.assertEqual(
+ windowed.collect(), df.withColumn("wm", sf.mean(df.v).over(w)).collect()
+ )
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("weighted_mean", weighted_mean)
+
+ for w in [
+ "ROWS BETWEEN 2 PRECEDING AND 1 FOLLOWING",
+ "ROWS BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING",
+ ]:
+ window_spec = f"PARTITION BY id ORDER BY v {w}"
+ for i, func_call in enumerate(
+ [
+ "weighted_mean(v, w => w)",
+ "weighted_mean(v => v, w => w)",
+ "weighted_mean(w => w, v => v)",
+ ]
+ ):
+ with self.subTest(window_spec=window_spec, query_no=i):
+ self.assertEqual(
+ self.spark.sql(
+ f"SELECT id, {func_call} OVER ({window_spec}) as wm FROM v"
+ ).collect(),
+ self.spark.sql(
+ f"SELECT id, mean(v) OVER ({window_spec}) as wm FROM v"
+ ).collect(),
+ )
+
+ def test_named_arguments_negative(self):
+ df = self.data
+ weighted_mean = self.arrow_agg_weighted_mean_udf
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("weighted_mean", weighted_mean)
+
+ base_sql = "SELECT id, {func_call} OVER ({window_spec}) as wm FROM v"
+
+ for w in [
+ "ROWS BETWEEN 2 PRECEDING AND 1 FOLLOWING",
+ "ROWS BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING",
+ ]:
+ window_spec = f"PARTITION BY id ORDER BY v {w}"
+ with self.subTest(window_spec=window_spec):
+ with self.assertRaisesRegex(
+ AnalysisException,
+ "DUPLICATE_ROUTINE_PARAMETER_ASSIGNMENT.DOUBLE_NAMED_ARGUMENT_REFERENCE",
+ ):
+ self.spark.sql(
+ base_sql.format(
+ func_call="weighted_mean(v => v, v => w)", window_spec=window_spec
+ )
+ ).show()
+
+ with self.assertRaisesRegex(
+ AnalysisException, "UNEXPECTED_POSITIONAL_ARGUMENT"
+ ):
+ self.spark.sql(
+ base_sql.format(
+ func_call="weighted_mean(v => v, w)", window_spec=window_spec
+ )
+ ).show()
+
+ with self.assertRaisesRegex(
+ PythonException, r"weighted_mean\(\) got an unexpected keyword argument 'x'"
+ ):
+ self.spark.sql(
+ base_sql.format(
+ func_call="weighted_mean(v => v, x => w)", window_spec=window_spec
+ )
+ ).show()
+
+ with self.assertRaisesRegex(
+ PythonException, r"weighted_mean\(\) got multiple values for argument 'v'"
+ ):
+ self.spark.sql(
+ base_sql.format(
+ func_call="weighted_mean(v, v => w)", window_spec=window_spec
+ )
+ ).show()
+
+ def test_kwargs(self):
+ df = self.data
+
+ @arrow_udf("double", ArrowUDFType.GROUPED_AGG)
+ def weighted_mean(**kwargs):
+ import numpy as np
+
+ return np.average(kwargs["v"], weights=kwargs["w"])
+
+ for w, bound in [(self.sliding_row_window, True), (self.unbounded_window, False)]:
+ for i, windowed in enumerate(
+ [
+ df.withColumn("wm", weighted_mean(v=df.v, w=df.w).over(w)),
+ df.withColumn("wm", weighted_mean(w=df.w, v=df.v).over(w)),
+ ]
+ ):
+ with self.subTest(bound=bound, query_no=i):
+ self.assertEqual(
+ windowed.collect(), df.withColumn("wm", sf.mean(df.v).over(w)).collect()
+ )
+
+ with self.tempView("v"):
+ df.createOrReplaceTempView("v")
+ self.spark.udf.register("weighted_mean", weighted_mean)
+
+ base_sql = "SELECT id, {func_call} OVER ({window_spec}) as wm FROM v"
+
+ for w in [
+ "ROWS BETWEEN 2 PRECEDING AND 1 FOLLOWING",
+ "ROWS BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING",
+ ]:
+ window_spec = f"PARTITION BY id ORDER BY v {w}"
+ with self.subTest(window_spec=window_spec):
+ for i, func_call in enumerate(
+ [
+ "weighted_mean(v => v, w => w)",
+ "weighted_mean(w => w, v => v)",
+ ]
+ ):
+ with self.subTest(query_no=i):
+ self.assertEqual(
+ self.spark.sql(
+ base_sql.format(func_call=func_call, window_spec=window_spec)
+ ).collect(),
+ self.spark.sql(
+ base_sql.format(func_call="mean(v)", window_spec=window_spec)
+ ).collect(),
+ )
+
+ # negative
+ with self.assertRaisesRegex(
+ AnalysisException,
+ "DUPLICATE_ROUTINE_PARAMETER_ASSIGNMENT.DOUBLE_NAMED_ARGUMENT_REFERENCE",
+ ):
+ self.spark.sql(
+ base_sql.format(
+ func_call="weighted_mean(v => v, v => w)", window_spec=window_spec
+ )
+ ).show()
+
+ with self.assertRaisesRegex(
+ AnalysisException, "UNEXPECTED_POSITIONAL_ARGUMENT"
+ ):
+ self.spark.sql(
+ base_sql.format(
+ func_call="weighted_mean(v => v, w)", window_spec=window_spec
+ )
+ ).show()
+
+ def test_complex_window_collect_set(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (1, 2), (2, 3), (2, 5), (2, 3)], ("id", "v"))
+ w = Window.partitionBy("id").orderBy("v")
+
+ @arrow_udf("array<int>")
+ def arrow_collect_set(v: pa.Array) -> pa.Scalar:
+ assert isinstance(v, pa.Array), str(type(v))
+ s = sorted([x.as_py() for x in pa.compute.unique(v)])
+ t = pa.list_(pa.int32())
+ return pa.scalar(value=s, type=t)
+
+ result1 = df.select(
+ arrow_collect_set(df["v"]).over(w).alias("vs"),
+ )
+
+ expected1 = df.select(
+ sf.sort_array(sf.collect_set(df["v"]).over(w)).alias("vs"),
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_complex_window_collect_list(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (1, 2), (2, 3), (2, 5), (2, 3)], ("id", "v"))
+ w = Window.partitionBy("id").orderBy("v")
+
+ @arrow_udf("array<int>")
+ def arrow_collect_list(v: pa.Array) -> pa.Scalar:
+ assert isinstance(v, pa.Array), str(type(v))
+ s = sorted([x.as_py() for x in v])
+ t = pa.list_(pa.int32())
+ return pa.scalar(value=s, type=t)
+
+ result1 = df.select(
+ arrow_collect_list(df["v"]).over(w).alias("vs"),
+ )
+
+ expected1 = df.select(
+ sf.sort_array(sf.collect_list(df["v"]).over(w)).alias("vs"),
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_complex_window_collect_as_map(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame(
+ [(1, 2, 1), (1, 3, 2), (2, 4, 3), (2, 5, 5), (2, 6, 3)], ("id", "k", "v")
+ )
+ w = Window.partitionBy("id").orderBy("v")
+
+ @arrow_udf("map<int, int>")
+ def arrow_collect_as_map(id: pa.Array, v: pa.Array) -> pa.Scalar:
+ assert isinstance(id, pa.Array), str(type(id))
+ assert isinstance(v, pa.Array), str(type(v))
+ d = {i: j for i, j in zip(id.to_pylist(), v.to_pylist())}
+ t = pa.map_(pa.int32(), pa.int32())
+ return pa.scalar(value=d, type=t)
+
+ result1 = df.select(
+ arrow_collect_as_map("k", "v").over(w).alias("map"),
+ )
+
+ expected1 = df.select(
+ sf.map_from_arrays(
+ sf.collect_list("k").over(w),
+ sf.collect_list("v").over(w),
+ ).alias("map")
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_complex_window_min_max_struct(self):
+ import pyarrow as pa
+
+ df = self.spark.createDataFrame([(1, 1), (1, 2), (2, 3), (2, 5), (2, 3)], ("id", "v"))
+ w = Window.partitionBy("id").orderBy("v")
+
+ @arrow_udf("struct<m1: int, m2: int>")
+ def arrow_collect_min_max(id: pa.Array, v: pa.Array) -> pa.Scalar:
+ assert isinstance(id, pa.Array), str(type(id))
+ assert isinstance(v, pa.Array), str(type(v))
+ m1 = pa.compute.min(id)
+ m2 = pa.compute.max(v)
+ t = pa.struct([pa.field("m1", pa.int32()), pa.field("m2", pa.int32())])
+ return pa.scalar(value={"m1": m1.as_py(), "m2": m2.as_py()}, type=t)
+
+ result1 = df.select(
+ arrow_collect_min_max("id", "v").over(w).alias("struct"),
+ )
+
+ expected1 = df.select(
+ sf.struct(
+ sf.min("id").over(w).alias("m1"),
+ sf.max("v").over(w).alias("m2"),
+ ).alias("struct")
+ )
+
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ def test_time_min(self):
+ import pyarrow as pa
+
+ df = self.spark.sql(
+ """
+ SELECT * FROM VALUES
+ (1, TIME '12:34:56'),
+ (1, TIME '1:2:3'),
+ (2, TIME '0:58:59'),
+ (2, TIME '10:58:59'),
+ (2, TIME '10:00:03')
+ AS tab(i, t)
+ """
+ )
+ w1 = Window.partitionBy("i").orderBy("t")
+ w2 = Window.orderBy("t")
+
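+        # TIME columns reach the UDF as a pyarrow Time64Array; returning the
+        # frame minimum should match the builtin min("t") over the same windows.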
+ @arrow_udf("time", ArrowUDFType.GROUPED_AGG)
+ def agg_min_time(v):
+ assert isinstance(v, pa.Array)
+ assert isinstance(v, pa.Time64Array)
+ return pa.compute.min(v)
+
+ expected1 = df.withColumn("res", sf.min("t").over(w1))
+ result1 = df.withColumn("res", agg_min_time("t").over(w1))
+ self.assertEqual(expected1.collect(), result1.collect())
+
+ expected2 = df.withColumn("res", sf.min("t").over(w2))
+ result2 = df.withColumn("res", agg_min_time("t").over(w2))
+ self.assertEqual(expected2.collect(), result2.collect())
+
+ def test_return_type_coercion(self):
+ import pyarrow as pa
+
+ df = self.spark.range(10).withColumn("v", sf.lit(1))
+ w = Window.partitionBy("id").orderBy("v")
+
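+        # The Arrow scalar returned by the UDF is coerced to the declared return
+        # type: an exact match, a safe long -> int cast, and an overflowing cast
+        # that fails at collection time are covered below.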
+ @arrow_udf("long", ArrowUDFType.GROUPED_AGG)
+ def agg_long(id: pa.Array) -> int:
+ assert isinstance(id, pa.Array), str(type(id))
+ return pa.scalar(value=len(id), type=pa.int64())
+
+ result1 = df.select(agg_long("v").over(w).alias("res"))
+ self.assertEqual(10, len(result1.collect()))
+
+ # long -> int coercion
+ @arrow_udf("int", ArrowUDFType.GROUPED_AGG)
+ def agg_int1(id: pa.Array) -> int:
+ assert isinstance(id, pa.Array), str(type(id))
+ return pa.scalar(value=len(id), type=pa.int64())
+
+ result2 = df.select(agg_int1("v").over(w).alias("res"))
+ self.assertEqual(10, len(result2.collect()))
+
+ # long -> int coercion, overflow
+ @arrow_udf("int", ArrowUDFType.GROUPED_AGG)
+ def agg_int2(id: pa.Array) -> int:
+ assert isinstance(id, pa.Array), str(type(id))
+ return pa.scalar(value=len(id) + 2147483647, type=pa.int64())
+
+ result3 = df.select(agg_int2("id").alias("res"))
+ with self.assertRaises(Exception):
+ # pyarrow.lib.ArrowInvalid:
+ # Integer value 2147483657 not in range: -2147483648 to 2147483647
+ result3.collect()
+
+
+class WindowArrowUDFTests(WindowArrowUDFTestsMixin, ReusedSQLTestCase):
+ pass
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.arrow.test_arrow_udf_window import * # noqa: F401
+
+ try:
+ import xmlrunner
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/arrow/test_arrow_udtf.py b/python/pyspark/sql/tests/arrow/test_arrow_udtf.py
new file mode 100644
index 0000000000000..d655639faafe4
--- /dev/null
+++ b/python/pyspark/sql/tests/arrow/test_arrow_udtf.py
@@ -0,0 +1,624 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+import unittest
+from typing import Iterator
+
+from pyspark.errors import PySparkAttributeError
+from pyspark.errors import PythonException
+from pyspark.sql.functions import arrow_udtf, lit
+from pyspark.sql.types import Row, StructType, StructField, IntegerType
+from pyspark.testing.sqlutils import ReusedSQLTestCase, have_pyarrow, pyarrow_requirement_message
+from pyspark.testing import assertDataFrameEqual
+
+if have_pyarrow:
+ import pyarrow as pa
+ import pyarrow.compute as pc
+
+
+@unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+class ArrowUDTFTestsMixin:
+ def test_arrow_udtf_zero_args(self):
+ @arrow_udtf(returnType="id int, value string")
+ class TestUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ result_table = pa.table(
+ {
+ "id": pa.array([1, 2, 3], type=pa.int32()),
+ "value": pa.array(["a", "b", "c"], type=pa.string()),
+ }
+ )
+ yield result_table
+
+ # Test direct DataFrame API usage
+ result_df = TestUDTF()
+ expected_df = self.spark.createDataFrame(
+ [(1, "a"), (2, "b"), (3, "c")], "id int, value string"
+ )
+ assertDataFrameEqual(result_df, expected_df)
+
+ # Test SQL registration and usage
+ self.spark.udtf.register("test_zero_args_udtf", TestUDTF)
+ sql_result_df = self.spark.sql("SELECT * FROM test_zero_args_udtf()")
+ assertDataFrameEqual(sql_result_df, expected_df)
+
+ def test_arrow_udtf_scalar_args_only(self):
+ @arrow_udtf(returnType="x int, y int, sum int")
+ class ScalarArgsUDTF:
+ def eval(self, x: "pa.Array", y: "pa.Array") -> Iterator["pa.Table"]:
+ assert isinstance(x, pa.Array), f"Expected pa.Array, got {type(x)}"
+ assert isinstance(y, pa.Array), f"Expected pa.Array, got {type(y)}"
+
+ x_val = x[0].as_py()
+ y_val = y[0].as_py()
+ result_table = pa.table(
+ {
+ "x": pa.array([x_val], type=pa.int32()),
+ "y": pa.array([y_val], type=pa.int32()),
+ "sum": pa.array([x_val + y_val], type=pa.int32()),
+ }
+ )
+ yield result_table
+
+ # Test direct DataFrame API usage
+ result_df = ScalarArgsUDTF(lit(5), lit(10))
+ expected_df = self.spark.createDataFrame([(5, 10, 15)], "x int, y int, sum int")
+ assertDataFrameEqual(result_df, expected_df)
+
+ # Test SQL registration and usage
+ self.spark.udtf.register("ScalarArgsUDTF", ScalarArgsUDTF)
+ sql_result_df = self.spark.sql("SELECT * FROM ScalarArgsUDTF(5, 10)")
+ assertDataFrameEqual(sql_result_df, expected_df)
+
+ # Test with different values via SQL
+ sql_result_df2 = self.spark.sql("SELECT * FROM ScalarArgsUDTF(4, 7)")
+ expected_df2 = self.spark.createDataFrame([(4, 7, 11)], "x int, y int, sum int")
+ assertDataFrameEqual(sql_result_df2, expected_df2)
+
+ def test_arrow_udtf_record_batch_iterator(self):
+ @arrow_udtf(returnType="batch_id int, name string, count int")
+ class RecordBatchUDTF:
+ def eval(self, batch_size: "pa.Array") -> Iterator["pa.RecordBatch"]:
+ assert isinstance(
+ batch_size, pa.Array
+ ), f"Expected pa.Array, got {type(batch_size)}"
+
+ size = batch_size[0].as_py()
+
+ for batch_id in range(3):
+ # Create arrays for each column
+ batch_id_array = pa.array([batch_id] * size, type=pa.int32())
+ name_array = pa.array([f"batch_{batch_id}"] * size, type=pa.string())
+ count_array = pa.array(list(range(size)), type=pa.int32())
+
+ # Create record batch from arrays and names
+ batch = pa.record_batch(
+ [batch_id_array, name_array, count_array],
+ names=["batch_id", "name", "count"],
+ )
+ yield batch
+
+ # Test direct DataFrame API usage
+ result_df = RecordBatchUDTF(lit(2))
+ expected_data = [
+ (0, "batch_0", 0),
+ (0, "batch_0", 1),
+ (1, "batch_1", 0),
+ (1, "batch_1", 1),
+ (2, "batch_2", 0),
+ (2, "batch_2", 1),
+ ]
+ expected_df = self.spark.createDataFrame(
+ expected_data, "batch_id int, name string, count int"
+ )
+ assertDataFrameEqual(result_df, expected_df)
+
+ # Test SQL registration and usage
+ self.spark.udtf.register("record_batch_udtf", RecordBatchUDTF)
+ sql_result_df = self.spark.sql(
+ "SELECT * FROM record_batch_udtf(2) ORDER BY batch_id, count"
+ )
+ assertDataFrameEqual(sql_result_df, expected_df)
+
+ # Test with different batch size via SQL
+ sql_result_df2 = self.spark.sql("SELECT * FROM record_batch_udtf(1) ORDER BY batch_id")
+ expected_data2 = [
+ (0, "batch_0", 0),
+ (1, "batch_1", 0),
+ (2, "batch_2", 0),
+ ]
+ expected_df2 = self.spark.createDataFrame(
+ expected_data2, "batch_id int, name string, count int"
+ )
+ assertDataFrameEqual(sql_result_df2, expected_df2)
+
+ def test_arrow_udtf_error_not_iterator(self):
+ @arrow_udtf(returnType="x int, y string")
+ class NotIteratorUDTF:
+ def eval(self) -> "pa.Table":
+ return pa.table(
+ {"x": pa.array([1], type=pa.int32()), "y": pa.array(["test"], type=pa.string())}
+ )
+
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_NOT_ITERABLE"):
+ result_df = NotIteratorUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_error_wrong_yield_type(self):
+ @arrow_udtf(returnType="x int, y string")
+ class WrongYieldTypeUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ yield {"x": [1], "y": ["test"]}
+
+ with self.assertRaisesRegex(PythonException, "UDTF_ARROW_TYPE_CONVERSION_ERROR"):
+ result_df = WrongYieldTypeUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_error_invalid_arrow_type(self):
+ @arrow_udtf(returnType="x int, y string")
+ class InvalidArrowTypeUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ yield "not_an_arrow_table"
+
+ with self.assertRaisesRegex(PythonException, "UDTF_ARROW_TYPE_CONVERSION_ERROR"):
+ result_df = InvalidArrowTypeUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_error_mismatched_schema(self):
+ @arrow_udtf(returnType="x int, y string")
+ class MismatchedSchemaUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ result_table = pa.table(
+ {
+ "wrong_col": pa.array([1], type=pa.int32()),
+ "another_wrong_col": pa.array([2.5], type=pa.float64()),
+ }
+ )
+ yield result_table
+
+ with self.assertRaisesRegex(PythonException, "Schema at index 0 was different"):
+ result_df = MismatchedSchemaUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_sql_with_aggregation(self):
+ @arrow_udtf(returnType="category string, count int")
+ class CategoryCountUDTF:
+ def eval(self, categories: "pa.Array") -> Iterator["pa.Table"]:
+ # The input is a single array element, extract the array contents
+ cat_array = categories[0].as_py() # Get the array from the first (and only) element
+
+ # Count occurrences
+ counts = {}
+ for cat in cat_array:
+ if cat is not None:
+ counts[cat] = counts.get(cat, 0) + 1
+
+ if counts:
+ result_table = pa.table(
+ {
+ "category": pa.array(list(counts.keys()), type=pa.string()),
+ "count": pa.array(list(counts.values()), type=pa.int32()),
+ }
+ )
+ yield result_table
+
+ self.spark.udtf.register("category_count_udtf", CategoryCountUDTF)
+
+ # Test with array input
+ result_df = self.spark.sql(
+ "SELECT * FROM category_count_udtf(array('A', 'B', 'A', 'C', 'B', 'A')) "
+ "ORDER BY category"
+ )
+ expected_df = self.spark.createDataFrame(
+ [("A", 3), ("B", 2), ("C", 1)], "category string, count int"
+ )
+ assertDataFrameEqual(result_df, expected_df)
+
+ def test_arrow_udtf_sql_with_struct_output(self):
+        @arrow_udtf(returnType="person struct<name: string, age: int>, status string")
+ class PersonStatusUDTF:
+ def eval(self, name: "pa.Array", age: "pa.Array") -> Iterator["pa.Table"]:
+ name_val = name[0].as_py()
+ age_val = age[0].as_py()
+
+ status = "adult" if age_val >= 18 else "minor"
+
+ # Create struct array
+ person_array = pa.array(
+ [{"name": name_val, "age": age_val}],
+ type=pa.struct([("name", pa.string()), ("age", pa.int32())]),
+ )
+
+ result_table = pa.table(
+ {
+ "person": person_array,
+ "status": pa.array([status], type=pa.string()),
+ }
+ )
+ yield result_table
+
+ self.spark.udtf.register("person_status_udtf", PersonStatusUDTF)
+
+ result_df = self.spark.sql("SELECT * FROM person_status_udtf('John', 25)")
+ # Note: Using Row constructor for the expected struct value
+ expected_df = self.spark.createDataFrame(
+ [(Row(name="John", age=25), "adult")],
+            "person struct<name: string, age: int>, status string",
+ )
+ assertDataFrameEqual(result_df, expected_df)
+
+ def test_arrow_udtf_sql_conditional_yield(self):
+ @arrow_udtf(returnType="number int, type string")
+ class FilterNumbersUDTF:
+ def eval(self, start: "pa.Array", end: "pa.Array") -> Iterator["pa.Table"]:
+ start_val = start[0].as_py()
+ end_val = end[0].as_py()
+
+ numbers = []
+ types = []
+
+ for i in range(start_val, end_val + 1):
+ if i % 2 == 0: # Only yield even numbers
+ numbers.append(i)
+ types.append("even")
+
+ if numbers: # Only yield if we have data
+ result_table = pa.table(
+ {
+ "number": pa.array(numbers, type=pa.int32()),
+ "type": pa.array(types, type=pa.string()),
+ }
+ )
+ yield result_table
+
+ self.spark.udtf.register("filter_numbers_udtf", FilterNumbersUDTF)
+
+ result_df = self.spark.sql("SELECT * FROM filter_numbers_udtf(1, 10) ORDER BY number")
+ expected_df = self.spark.createDataFrame(
+ [(2, "even"), (4, "even"), (6, "even"), (8, "even"), (10, "even")],
+ "number int, type string",
+ )
+ assertDataFrameEqual(result_df, expected_df)
+
+ def test_arrow_udtf_sql_empty_result(self):
+ @arrow_udtf(returnType="value int")
+ class EmptyResultUDTF:
+ def eval(self, condition: "pa.Array") -> Iterator["pa.Table"]:
+ # Only yield if condition is true
+ if condition[0].as_py():
+ result_table = pa.table(
+ {
+ "value": pa.array([42], type=pa.int32()),
+ }
+ )
+ yield result_table
+ # If condition is false, don't yield anything
+
+ self.spark.udtf.register("empty_result_udtf", EmptyResultUDTF)
+
+ # Test with true condition
+ result_df_true = self.spark.sql("SELECT * FROM empty_result_udtf(true)")
+ expected_df_true = self.spark.createDataFrame([(42,)], "value int")
+ assertDataFrameEqual(result_df_true, expected_df_true)
+
+ # Test with false condition (empty result)
+ result_df_false = self.spark.sql("SELECT * FROM empty_result_udtf(false)")
+ expected_df_false = self.spark.createDataFrame([], "value int")
+ assertDataFrameEqual(result_df_false, expected_df_false)
+
+ def test_arrow_udtf_type_coercion_long_to_int(self):
+ @arrow_udtf(returnType="id int")
+ class LongToIntUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ result_table = pa.table(
+ {
+ "id": pa.array([1, 2, 3], type=pa.int64()), # long values
+ }
+ )
+ yield result_table
+
+ with self.assertRaisesRegex(PythonException, "Schema at index 0 was different"):
+ result_df = LongToIntUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_type_coercion_string_to_int(self):
+ @arrow_udtf(returnType="id int")
+ class StringToIntUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ # Return string values that cannot be coerced to int
+ result_table = pa.table(
+ {
+ "id": pa.array(["abc", "def", "xyz"], type=pa.string()),
+ }
+ )
+ yield result_table
+
+ with self.assertRaisesRegex(PythonException, "Schema at index 0 was different"):
+ result_df = StringToIntUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_with_empty_column_result(self):
+ @arrow_udtf(returnType=StructType())
+ class EmptyResultUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ yield pa.Table.from_struct_array(pa.array([{}] * 3))
+
+ assertDataFrameEqual(EmptyResultUDTF(), [Row(), Row(), Row()])
+
+ @arrow_udtf(returnType="id int")
+ class InvalidEmptyResultUDTF:
+ def eval(self) -> Iterator["pa.Table"]:
+ yield pa.Table.from_struct_array(pa.array([{}] * 3))
+
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
+ result_df = InvalidEmptyResultUDTF()
+ result_df.collect()
+
+ def test_arrow_udtf_blocks_analyze_method_none_return_type(self):
+ with self.assertRaises(PySparkAttributeError) as cm:
+
+ @arrow_udtf
+ class AnalyzeUDTF:
+ def eval(self, input_col: "pa.Array") -> Iterator["pa.Table"]:
+ yield pa.table({"result": pa.array([1, 2, 3])})
+
+ @staticmethod
+ def analyze(arg):
+ from pyspark.sql.udtf import AnalyzeResult
+
+ return AnalyzeResult(
+ schema=StructType([StructField("result", IntegerType(), True)])
+ )
+
+ self.assertIn("INVALID_ARROW_UDTF_WITH_ANALYZE", str(cm.exception))
+
+ def test_arrow_udtf_blocks_analyze_method_with_return_type(self):
+ with self.assertRaises(PySparkAttributeError) as cm:
+
+ @arrow_udtf(returnType="result: int")
+ class AnalyzeUDTF:
+ def eval(self, input_col: "pa.Array") -> Iterator["pa.Table"]:
+ yield pa.table({"result": pa.array([1, 2, 3])})
+
+ @staticmethod
+ def analyze(arg):
+ from pyspark.sql.udtf import AnalyzeResult
+
+ return AnalyzeResult(
+ schema=StructType([StructField("result", IntegerType(), True)])
+ )
+
+ self.assertIn("INVALID_UDTF_BOTH_RETURN_TYPE_AND_ANALYZE", str(cm.exception))
+
+ def test_arrow_udtf_with_table_argument_basic(self):
+ @arrow_udtf(returnType="filtered_id bigint") # Use bigint to match int64
+ class TableArgUDTF:
+ def eval(self, table_data: "pa.RecordBatch") -> Iterator["pa.Table"]:
+ assert isinstance(
+ table_data, pa.RecordBatch
+ ), f"Expected pa.RecordBatch, got {type(table_data)}"
+
+ # Convert record batch to table to work with it more easily
+ table = pa.table(table_data)
+
+ # Filter rows where id > 5
+ id_column = table.column("id")
+ mask = pa.compute.greater(id_column, pa.scalar(5))
+ filtered_table = table.filter(mask)
+
+ if filtered_table.num_rows > 0:
+ result_table = pa.table(
+ {"filtered_id": filtered_table.column("id")} # Keep original type (int64)
+ )
+ yield result_table
+
+ # Test with DataFrame API using asTable()
+ input_df = self.spark.range(8)
+ result_df = TableArgUDTF(input_df.asTable())
+ expected_df = self.spark.createDataFrame([(6,), (7,)], "filtered_id bigint")
+ assertDataFrameEqual(result_df, expected_df)
+
+ # Test SQL registration and usage with TABLE() syntax
+ self.spark.udtf.register("test_table_arg_udtf", TableArgUDTF)
+ sql_result_df = self.spark.sql(
+ "SELECT * FROM test_table_arg_udtf(TABLE(SELECT id FROM range(0, 8)))"
+ )
+ assertDataFrameEqual(sql_result_df, expected_df)
+
+ def test_arrow_udtf_with_table_argument_and_scalar(self):
+ @arrow_udtf(returnType="filtered_id bigint") # Use bigint to match int64
+ class MixedArgsUDTF:
+ def eval(
+ self, table_data: "pa.RecordBatch", threshold: "pa.Array"
+ ) -> Iterator["pa.Table"]:
+ assert isinstance(
+ threshold, pa.Array
+ ), f"Expected pa.Array for threshold, got {type(threshold)}"
+ assert isinstance(
+ table_data, pa.RecordBatch
+ ), f"Expected pa.RecordBatch for table_data, got {type(table_data)}"
+
+ threshold_val = threshold[0].as_py()
+
+ # Convert record batch to table
+ table = pa.table(table_data)
+ id_column = table.column("id")
+ mask = pa.compute.greater(id_column, pa.scalar(threshold_val))
+ filtered_table = table.filter(mask)
+
+ if filtered_table.num_rows > 0:
+ result_table = pa.table(
+ {"filtered_id": filtered_table.column("id")} # Keep original type
+ )
+ yield result_table
+
+        # Test with DataFrame API
+ input_df = self.spark.range(8)
+ result_df = MixedArgsUDTF(input_df.asTable(), lit(5))
+ expected_df = self.spark.createDataFrame([(6,), (7,)], "filtered_id bigint")
+ assertDataFrameEqual(result_df, expected_df)
+
+ # Test SQL registration and usage
+ self.spark.udtf.register("test_mixed_args_udtf", MixedArgsUDTF)
+ sql_result_df = self.spark.sql(
+ "SELECT * FROM test_mixed_args_udtf(TABLE(SELECT id FROM range(0, 8)), 5)"
+ )
+ assertDataFrameEqual(sql_result_df, expected_df)
+
+ def test_arrow_udtf_lateral_join_disallowed(self):
+ @arrow_udtf(returnType="x int, result int")
+ class SimpleArrowUDTF:
+ def eval(self, input_val: "pa.Array") -> Iterator["pa.Table"]:
+ val = input_val[0].as_py()
+ result_table = pa.table(
+ {
+ "x": pa.array([val], type=pa.int32()),
+ "result": pa.array([val * 2], type=pa.int32()),
+ }
+ )
+ yield result_table
+
+ self.spark.udtf.register("simple_arrow_udtf", SimpleArrowUDTF)
+
+ test_df = self.spark.createDataFrame([(1,), (2,), (3,)], "id int")
+ test_df.createOrReplaceTempView("test_table")
+
+ with self.assertRaisesRegex(Exception, "LATERAL_JOIN_WITH_ARROW_UDTF_UNSUPPORTED"):
+ self.spark.sql(
+ """
+ SELECT t.id, f.x, f.result
+ FROM test_table t, LATERAL simple_arrow_udtf(t.id) f
+ """
+ )
+
+ def test_arrow_udtf_lateral_join_with_table_argument_disallowed(self):
+ @arrow_udtf(returnType="filtered_id bigint")
+ class MixedArgsUDTF:
+ def eval(self, input_table: "pa.Table") -> Iterator["pa.Table"]:
+ filtered_data = input_table.filter(pc.greater(input_table["id"], 5))
+ result_table = pa.table({"filtered_id": filtered_data["id"]})
+ yield result_table
+
+ self.spark.udtf.register("mixed_args_udtf", MixedArgsUDTF)
+
+ test_df1 = self.spark.createDataFrame([(1,), (2,), (3,)], "id int")
+ test_df1.createOrReplaceTempView("test_table1")
+
+ test_df2 = self.spark.createDataFrame([(6,), (7,), (8,)], "id bigint")
+ test_df2.createOrReplaceTempView("test_table2")
+
+ # Table arguments create nested lateral joins where our CheckAnalysis rule doesn't trigger
+ # because the Arrow UDTF is in the inner lateral join, not the outer one our rule checks.
+ # So Spark's general lateral join validation catches this first with
+ # NON_DETERMINISTIC_LATERAL_SUBQUERIES.
+ with self.assertRaisesRegex(
+ Exception,
+ "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.NON_DETERMINISTIC_LATERAL_SUBQUERIES",
+ ):
+ self.spark.sql(
+ """
+ SELECT t1.id, f.filtered_id
+ FROM test_table1 t1, LATERAL mixed_args_udtf(table(SELECT * FROM test_table2)) f
+ """
+ )
+
+ def test_arrow_udtf_with_table_argument_then_lateral_join_allowed(self):
+ @arrow_udtf(returnType="processed_id bigint")
+ class TableArgUDTF:
+ def eval(self, input_table: "pa.Table") -> Iterator["pa.Table"]:
+ processed_data = pc.add(input_table["id"], 100)
+ result_table = pa.table({"processed_id": processed_data})
+ yield result_table
+
+ self.spark.udtf.register("table_arg_udtf", TableArgUDTF)
+
+ source_df = self.spark.createDataFrame([(1,), (2,), (3,)], "id bigint")
+ source_df.createOrReplaceTempView("source_table")
+
+ join_df = self.spark.createDataFrame([("A",), ("B",), ("C",)], "label string")
+ join_df.createOrReplaceTempView("join_table")
+
+ result_df = self.spark.sql(
+ """
+ SELECT f.processed_id, j.label
+ FROM table_arg_udtf(table(SELECT * FROM source_table)) f,
+ join_table j
+ ORDER BY f.processed_id, j.label
+ """
+ )
+
+ expected_data = [
+ (101, "A"),
+ (101, "B"),
+ (101, "C"),
+ (102, "A"),
+ (102, "B"),
+ (102, "C"),
+ (103, "A"),
+ (103, "B"),
+ (103, "C"),
+ ]
+ expected_df = self.spark.createDataFrame(expected_data, "processed_id bigint, label string")
+ assertDataFrameEqual(result_df, expected_df)
+
+ def test_arrow_udtf_table_argument_with_regular_udtf_lateral_join_allowed(self):
+ @arrow_udtf(returnType="computed_value int")
+ class ComputeUDTF:
+ def eval(self, input_table: "pa.Table") -> Iterator["pa.Table"]:
+ total = pc.sum(input_table["value"]).as_py()
+ result_table = pa.table({"computed_value": pa.array([total], type=pa.int32())})
+ yield result_table
+
+ from pyspark.sql.functions import udtf
+ from pyspark.sql.types import StructType, StructField, IntegerType
+
+ @udtf(returnType=StructType([StructField("multiplied", IntegerType())]))
+ class MultiplyUDTF:
+ def eval(self, input_val: int):
+ yield (input_val * 3,)
+
+ self.spark.udtf.register("compute_udtf", ComputeUDTF)
+ self.spark.udtf.register("multiply_udtf", MultiplyUDTF)
+
+ values_df = self.spark.createDataFrame([(10,), (20,), (30,)], "value int")
+ values_df.createOrReplaceTempView("values_table")
+
+ result_df = self.spark.sql(
+ """
+ SELECT c.computed_value, m.multiplied
+ FROM compute_udtf(table(SELECT * FROM values_table) WITH SINGLE PARTITION) c,
+ LATERAL multiply_udtf(c.computed_value) m
+ """
+ )
+
+ expected_df = self.spark.createDataFrame([(60, 180)], "computed_value int, multiplied int")
+ assertDataFrameEqual(result_df, expected_df)
+
+
+class ArrowUDTFTests(ArrowUDTFTestsMixin, ReusedSQLTestCase):
+ pass
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.arrow.test_arrow_udtf import * # noqa: F401
+
+ try:
+ import xmlrunner
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_python_udf.py b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_python_udf.py
index 8a5fe6131bd3d..6af55bb0b0bd1 100644
--- a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_python_udf.py
+++ b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_python_udf.py
@@ -33,6 +33,64 @@ def tearDownClass(cls):
super(ArrowPythonUDFParityTests, cls).tearDownClass()
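+
+# The mixins below pin spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled
+# so the Arrow Python UDF tests run under both the legacy and non-legacy
+# conversion paths.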
+class ArrowPythonUDFParityLegacyTestsMixin(ArrowPythonUDFTestsMixin):
+ @classmethod
+ def setUpClass(cls):
+ super().setUpClass()
+        cls.spark.conf.set(
+            "spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled", "true"
+        )
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled")
+ finally:
+ super().tearDownClass()
+
+
+class ArrowPythonUDFParityNonLegacyTestsMixin(ArrowPythonUDFTestsMixin):
+ @classmethod
+ def setUpClass(cls):
+ super().setUpClass()
+ cls.spark.conf.set(
+ "spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled", "false"
+ )
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.legacy.execution.pythonUDF.pandas.conversion.enabled")
+ finally:
+ super().tearDownClass()
+
+
+class ArrowPythonUDFParityLegacyTests(UDFParityTests, ArrowPythonUDFParityLegacyTestsMixin):
+ @classmethod
+ def setUpClass(cls):
+ super(ArrowPythonUDFParityLegacyTests, cls).setUpClass()
+ cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.enabled", "true")
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.execution.pythonUDF.arrow.enabled")
+ finally:
+ super(ArrowPythonUDFParityLegacyTests, cls).tearDownClass()
+
+
+class ArrowPythonUDFParityNonLegacyTests(UDFParityTests, ArrowPythonUDFParityNonLegacyTestsMixin):
+ @classmethod
+ def setUpClass(cls):
+ super(ArrowPythonUDFParityNonLegacyTests, cls).setUpClass()
+ cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.enabled", "true")
+
+ @classmethod
+ def tearDownClass(cls):
+ try:
+ cls.spark.conf.unset("spark.sql.execution.pythonUDF.arrow.enabled")
+ finally:
+ super(ArrowPythonUDFParityNonLegacyTests, cls).tearDownClass()
+
+
if __name__ == "__main__":
import unittest
from pyspark.sql.tests.connect.arrow.test_parity_arrow_python_udf import * # noqa: F401
diff --git a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf.py b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf.py
index 567ab6913d30b..d3dd6d7f87037 100644
--- a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf.py
+++ b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf.py
@@ -15,12 +15,18 @@
# limitations under the License.
#
+import os
+import time
+
from pyspark.sql.tests.arrow.test_arrow_udf import ArrowUDFTestsMixin
from pyspark.testing.connectutils import ReusedConnectTestCase
class ArrowPythonUDFParityTests(ArrowUDFTestsMixin, ReusedConnectTestCase):
- pass
+    def setUp(self):
+        super().setUp()
+        # Synchronize the default timezone between Python and the JVM
+        tz = "America/Los_Angeles"
+        os.environ["TZ"] = tz
+        time.tzset()
if __name__ == "__main__":
diff --git a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf_grouped_agg.py b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf_grouped_agg.py
new file mode 100644
index 0000000000000..fea43edb5f824
--- /dev/null
+++ b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf_grouped_agg.py
@@ -0,0 +1,57 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import os
+import time
+
+from pyspark.sql.tests.arrow.test_arrow_udf_grouped_agg import GroupedAggArrowUDFTestsMixin
+from pyspark.testing.connectutils import ReusedConnectTestCase
+
+
+class GroupedAggArrowPythonUDFParityTests(GroupedAggArrowUDFTestsMixin, ReusedConnectTestCase):
+ @classmethod
+ def setUpClass(cls):
+ ReusedConnectTestCase.setUpClass()
+
+ # Synchronize default timezone between Python and Java
+ cls.tz_prev = os.environ.get("TZ", None) # save current tz if set
+ tz = "America/Los_Angeles"
+ os.environ["TZ"] = tz
+ time.tzset()
+
+ cls.spark.conf.set("spark.sql.session.timeZone", tz)
+
+ @classmethod
+ def tearDownClass(cls):
+ del os.environ["TZ"]
+ if cls.tz_prev is not None:
+ os.environ["TZ"] = cls.tz_prev
+ time.tzset()
+ ReusedConnectTestCase.tearDownClass()
+
+
+if __name__ == "__main__":
+ import unittest
+ from pyspark.sql.tests.connect.arrow.test_parity_arrow_udf_grouped_agg import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore[import]
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf_window.py b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf_window.py
new file mode 100644
index 0000000000000..5b834e291df51
--- /dev/null
+++ b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udf_window.py
@@ -0,0 +1,57 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import os
+import time
+
+from pyspark.sql.tests.arrow.test_arrow_udf_window import WindowArrowUDFTestsMixin
+from pyspark.testing.connectutils import ReusedConnectTestCase
+
+
+class WindowArrowPythonUDFParityTests(WindowArrowUDFTestsMixin, ReusedConnectTestCase):
+ @classmethod
+ def setUpClass(cls):
+ ReusedConnectTestCase.setUpClass()
+
+ # Synchronize default timezone between Python and Java
+ cls.tz_prev = os.environ.get("TZ", None) # save current tz if set
+ tz = "America/Los_Angeles"
+ os.environ["TZ"] = tz
+ time.tzset()
+
+ cls.spark.conf.set("spark.sql.session.timeZone", tz)
+
+ @classmethod
+ def tearDownClass(cls):
+ del os.environ["TZ"]
+ if cls.tz_prev is not None:
+ os.environ["TZ"] = cls.tz_prev
+ time.tzset()
+ ReusedConnectTestCase.tearDownClass()
+
+
+if __name__ == "__main__":
+ import unittest
+ from pyspark.sql.tests.connect.arrow.test_parity_arrow_udf_window import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore[import]
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udtf.py b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udtf.py
new file mode 100644
index 0000000000000..18227f493a0bd
--- /dev/null
+++ b/python/pyspark/sql/tests/connect/arrow/test_parity_arrow_udtf.py
@@ -0,0 +1,45 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import unittest
+
+from pyspark.sql.tests.arrow.test_arrow_udtf import ArrowUDTFTestsMixin
+from pyspark.testing.connectutils import ReusedConnectTestCase
+
+
+class ArrowUDTFParityTests(ArrowUDTFTestsMixin, ReusedConnectTestCase):
+ # TODO(SPARK-53323): Support table arguments in Spark Connect Arrow UDTFs
+ @unittest.skip("asTable() is not supported in Spark Connect")
+ def test_arrow_udtf_with_table_argument_basic(self):
+ super().test_arrow_udtf_with_table_argument_basic()
+
+ # TODO(SPARK-53323): Support table arguments in Spark Connect Arrow UDTFs
+ @unittest.skip("asTable() is not supported in Spark Connect")
+ def test_arrow_udtf_with_table_argument_and_scalar(self):
+ super().test_arrow_udtf_with_table_argument_and_scalar()
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.connect.arrow.test_parity_arrow_udtf import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore[import]
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/connect/client/test_client.py b/python/pyspark/sql/tests/connect/client/test_client.py
index 647b950fd20f4..c3954827bae54 100644
--- a/python/pyspark/sql/tests/connect/client/test_client.py
+++ b/python/pyspark/sql/tests/connect/client/test_client.py
@@ -34,7 +34,8 @@
DefaultPolicy,
)
from pyspark.sql.connect.client.reattach import ExecutePlanResponseReattachableIterator
- from pyspark.errors import PySparkRuntimeError, RetriesExceeded
+ from pyspark.sql.connect.session import SparkSession as RemoteSparkSession
+ from pyspark.errors import PySparkRuntimeError
import pyspark.sql.connect.proto as proto
class TestPolicy(DefaultPolicy):
@@ -226,40 +227,43 @@ def test_is_closed(self):
client.close()
self.assertTrue(client.is_closed)
- def test_retry(self):
- client = SparkConnectClient("sc://foo/;token=bar")
-
- total_sleep = 0
-
- def sleep(t):
- nonlocal total_sleep
- total_sleep += t
-
- try:
- for attempt in Retrying(client._retry_policies, sleep=sleep):
- with attempt:
- raise TestException("Retryable error", grpc.StatusCode.UNAVAILABLE)
- except RetriesExceeded:
- pass
+ def test_channel_builder_with_session(self):
+ dummy = str(uuid.uuid4())
+ chan = DefaultChannelBuilder(f"sc://foo/;session_id={dummy}")
+ client = SparkConnectClient(chan)
+ self.assertEqual(client._session_id, chan.session_id)
- # tolerated at least 10 mins of fails
- self.assertGreaterEqual(total_sleep, 600)
+ def test_session_hook(self):
+ inits = 0
+ calls = 0
- def test_retry_client_unit(self):
- client = SparkConnectClient("sc://foo/;token=bar")
+ class TestHook(RemoteSparkSession.Hook):
+ def __init__(self, _session):
+ nonlocal inits
+ inits += 1
- policyA = TestPolicy()
- policyB = DefaultPolicy()
+ def on_execute_plan(self, req):
+ nonlocal calls
+ calls += 1
+ return req
- client.set_retry_policies([policyA, policyB])
+ session = (
+ RemoteSparkSession.builder.remote("sc://foo")._registerHook(TestHook).getOrCreate()
+ )
+ self.assertEqual(inits, 1)
+ self.assertEqual(calls, 0)
+ session.client._stub = MockService(session.client._session_id)
+ session.client.disable_reattachable_execute()
- self.assertEqual(client.get_retry_policies(), [policyA, policyB])
+ # Called from _execute_and_fetch_as_iterator
+ session.range(1).collect()
+ self.assertEqual(inits, 1)
+ self.assertEqual(calls, 1)
- def test_channel_builder_with_session(self):
- dummy = str(uuid.uuid4())
- chan = DefaultChannelBuilder(f"sc://foo/;session_id={dummy}")
- client = SparkConnectClient(chan)
- self.assertEqual(client._session_id, chan.session_id)
+ # Called from _execute
+ session.udf.register("test_func", lambda x: x + 1)
+ self.assertEqual(inits, 1)
+ self.assertEqual(calls, 2)
def test_custom_operation_id(self):
client = SparkConnectClient("sc://foo/;token=bar", use_reattachable_execute=False)
@@ -390,7 +394,7 @@ def not_found():
def checks():
self.assertEqual(2, stub.execute_calls)
self.assertEqual(0, stub.attach_calls)
- self.assertEqual(0, stub.release_calls)
+ self.assertEqual(1, stub.release_calls)
self.assertEqual(0, stub.release_until_calls)
eventually(timeout=1, catch_assertions=True)(checks)()
diff --git a/python/pyspark/sql/tests/connect/client/test_client_retries.py b/python/pyspark/sql/tests/connect/client/test_client_retries.py
new file mode 100644
index 0000000000000..fb3263e2824f7
--- /dev/null
+++ b/python/pyspark/sql/tests/connect/client/test_client_retries.py
@@ -0,0 +1,248 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import unittest
+import warnings
+
+from pyspark.testing.connectutils import should_test_connect, connect_requirement_message
+
+if should_test_connect:
+ import grpc
+ import google.protobuf.any_pb2 as any_pb2
+ import google.protobuf.duration_pb2 as duration_pb2
+ from google.rpc import status_pb2
+ from google.rpc import error_details_pb2
+ from pyspark.sql.connect.client import SparkConnectClient
+ from pyspark.sql.connect.client.retries import (
+ Retrying,
+ DefaultPolicy,
+ )
+ from pyspark.sql.tests.connect.client.test_client import (
+ TestPolicy,
+ TestException,
+ )
+
+ class SleepTimeTracker:
+ """Tracks sleep times in ms for testing purposes."""
+
+ def __init__(self):
+ self._times = []
+
+ def sleep(self, t: float):
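+            # Record the requested sleep in milliseconds so the values can be
+            # compared directly with the policy's backoff settings.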
+ self._times.append(int(1000 * t))
+
+ @property
+ def times(self):
+ return list(self._times)
+
+ def create_test_exception_with_details(
+ msg: str,
+ code: grpc.StatusCode = grpc.StatusCode.INTERNAL,
+ retry_delay: int = 0,
+ ) -> TestException:
+ """Helper function for creating TestException with additional error details
+ like retry_delay.
+ """
+ retry_delay_msg = duration_pb2.Duration()
+ retry_delay_msg.FromMilliseconds(retry_delay)
+ retry_info = error_details_pb2.RetryInfo()
+ retry_info.retry_delay.CopyFrom(retry_delay_msg)
+
+ # Pack RetryInfo into an Any type
+ retry_info_any = any_pb2.Any()
+ retry_info_any.Pack(retry_info)
+ status = status_pb2.Status(
+ code=code.value[0],
+ message=msg,
+ details=[retry_info_any],
+ )
+ return TestException(msg=msg, code=code, trailing_status=status)
+
+ def get_client_policies_map(client: SparkConnectClient) -> dict:
+ return {type(policy): policy for policy in client.get_retry_policies()}
+
+
+@unittest.skipIf(not should_test_connect, connect_requirement_message)
+class SparkConnectClientRetriesTestCase(unittest.TestCase):
+ def assertListsAlmostEqual(self, first, second, places=None, msg=None, delta=None):
+ self.assertEqual(len(first), len(second), msg)
+ for i in range(len(first)):
+ self.assertAlmostEqual(first[i], second[i], places, msg, delta)
+
+ def test_retry(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+
+ sleep_tracker = SleepTimeTracker()
+ try:
+ for attempt in Retrying(client._retry_policies, sleep=sleep_tracker.sleep):
+ with attempt:
+ raise TestException("Retryable error", grpc.StatusCode.UNAVAILABLE)
+ except TestException:
+ pass
+
+        # The default policies should tolerate at least 10 minutes (600000 ms)
+        # of failures in total before giving up.
+        self.assertGreaterEqual(sum(sleep_tracker.times), 600000)
+
+ def test_retry_client_unit(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+
+ policyA = TestPolicy()
+ policyB = DefaultPolicy()
+
+ client.set_retry_policies([policyA, policyB])
+
+ self.assertEqual(client.get_retry_policies(), [policyA, policyB])
+
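+    # When retries are exhausted, the original exception is re-raised and a
+    # RETRIES_EXCEEDED warning is emitted instead of a RetriesExceeded error.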
+ def test_warning_works(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+ policy = get_client_policies_map(client).get(DefaultPolicy)
+ self.assertIsNotNone(policy)
+
+ sleep_tracker = SleepTimeTracker()
+ with warnings.catch_warnings(record=True) as warning_list:
+ warnings.simplefilter("always")
+ try:
+ for attempt in Retrying(client._retry_policies, sleep=sleep_tracker.sleep):
+ with attempt:
+ raise TestException(
+ msg="Some error message", code=grpc.StatusCode.UNAVAILABLE
+ )
+ except TestException:
+ pass
+ self.assertEqual(len(sleep_tracker.times), policy.max_retries)
+ self.assertEqual(len(warning_list), 1)
+ self.assertEqual(
+ str(warning_list[0].message),
+ "[RETRIES_EXCEEDED] The maximum number of retries has been exceeded.",
+ )
+
+ def test_default_policy_retries_retry_info(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+ policy = get_client_policies_map(client).get(DefaultPolicy)
+ self.assertIsNotNone(policy)
+
+ # retry delay = 0, error code not matched by any policy.
+ # Testing if errors with RetryInfo are being retried by the DefaultPolicy.
+ retry_delay = 0
+ sleep_tracker = SleepTimeTracker()
+ try:
+ for attempt in Retrying(client._retry_policies, sleep=sleep_tracker.sleep):
+ with attempt:
+ raise create_test_exception_with_details(
+ msg="Some error message",
+ code=grpc.StatusCode.UNIMPLEMENTED,
+ retry_delay=retry_delay,
+ )
+ except TestException:
+ pass
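+        # Expect client-side exponential backoff: initial_backoff * multiplier^i,
+        # capped at max_backoff, for each of the max_retries attempts.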
+ expected_times = [
+ min(policy.max_backoff, policy.initial_backoff * policy.backoff_multiplier**i)
+ for i in range(policy.max_retries)
+ ]
+ self.assertListsAlmostEqual(sleep_tracker.times, expected_times, delta=policy.jitter)
+
+ def test_retry_delay_overrides_max_backoff(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+ policy = get_client_policies_map(client).get(DefaultPolicy)
+ self.assertIsNotNone(policy)
+
+ # retry delay = 5 mins.
+ # Testing if retry_delay overrides max_backoff.
+ retry_delay = 5 * 60 * 1000
+ sleep_tracker = SleepTimeTracker()
+ # assert that retry_delay is greater than max_backoff to make sure the test is valid
+ self.assertGreaterEqual(retry_delay, policy.max_backoff)
+ try:
+ for attempt in Retrying(client._retry_policies, sleep=sleep_tracker.sleep):
+ with attempt:
+ raise create_test_exception_with_details(
+ "Some error message",
+ grpc.StatusCode.UNAVAILABLE,
+ retry_delay,
+ )
+ except TestException:
+ pass
+ expected_times = [retry_delay] * policy.max_retries
+ self.assertListsAlmostEqual(sleep_tracker.times, expected_times, delta=policy.jitter)
+
+ def test_max_server_retry_delay(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+ policy = get_client_policies_map(client).get(DefaultPolicy)
+ self.assertIsNotNone(policy)
+
+ # retry delay = 10 hours
+ # Testing if max_server_retry_delay limit works.
+ retry_delay = 10 * 60 * 60 * 1000
+ sleep_tracker = SleepTimeTracker()
+ try:
+ for attempt in Retrying(client._retry_policies, sleep=sleep_tracker.sleep):
+ with attempt:
+ raise create_test_exception_with_details(
+ "Some error message",
+ grpc.StatusCode.UNAVAILABLE,
+ retry_delay,
+ )
+ except TestException:
+ pass
+
+ expected_times = [policy.max_server_retry_delay] * policy.max_retries
+ self.assertListsAlmostEqual(sleep_tracker.times, expected_times, delta=policy.jitter)
+
+ def test_return_to_exponential_backoff(self):
+ client = SparkConnectClient("sc://foo/;token=bar")
+ policy = get_client_policies_map(client).get(DefaultPolicy)
+ self.assertIsNotNone(policy)
+
+ # Start with retry_delay = 5 mins, then set it to zero.
+ # Test if backoff goes back to client's exponential strategy.
+ initial_retry_delay = 5 * 60 * 1000
+ sleep_tracker = SleepTimeTracker()
+ try:
+ for i, attempt in enumerate(
+ Retrying(client._retry_policies, sleep=sleep_tracker.sleep)
+ ):
+ if i < 2:
+ retry_delay = initial_retry_delay
+ elif i < 5:
+ retry_delay = 0
+ else:
+ break
+ with attempt:
+ raise create_test_exception_with_details(
+ "Some error message",
+ grpc.StatusCode.UNAVAILABLE,
+ retry_delay,
+ )
+ except TestException:
+ pass
+
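+        # The first two sleeps follow the server-provided retry delay; once the
+        # delay drops to zero, the client falls back to exponential backoff.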
+ expected_times = [initial_retry_delay] * 2 + [
+ policy.initial_backoff * policy.backoff_multiplier**i for i in range(2, 5)
+ ]
+ self.assertListsAlmostEqual(sleep_tracker.times, expected_times, delta=policy.jitter)
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.connect.client.test_client_retries import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/connect/test_connect_column.py b/python/pyspark/sql/tests/connect/test_connect_column.py
index 4873006fbbb90..8983d45d42d14 100644
--- a/python/pyspark/sql/tests/connect/test_connect_column.py
+++ b/python/pyspark/sql/tests/connect/test_connect_column.py
@@ -25,6 +25,7 @@
MapType,
NullType,
DateType,
+ TimeType,
TimestampType,
TimestampNTZType,
ByteType,
@@ -396,6 +397,7 @@ def test_literal_with_acceptable_type(self):
("sss", StringType()),
(datetime.date(2022, 12, 13), DateType()),
(datetime.datetime.now(), DateType()),
+ (datetime.time(1, 0, 0), TimeType()),
(datetime.datetime.now(), TimestampType()),
(datetime.datetime.now(), TimestampNTZType()),
(datetime.timedelta(1, 2, 3), DayTimeIntervalType()),
@@ -441,6 +443,7 @@ def test_literal_null(self):
DoubleType(),
DecimalType(),
DateType(),
+ TimeType(),
TimestampType(),
TimestampNTZType(),
DayTimeIntervalType(),
diff --git a/python/pyspark/sql/tests/connect/test_connect_creation.py b/python/pyspark/sql/tests/connect/test_connect_creation.py
index 26e3596fc67df..917320d354e2b 100644
--- a/python/pyspark/sql/tests/connect/test_connect_creation.py
+++ b/python/pyspark/sql/tests/connect/test_connect_creation.py
@@ -530,12 +530,15 @@ def test_create_dataframe_from_pandas_with_ns_timestamp(self):
from pandas import Timestamp
import pandas as pd
+        # Nanoseconds are truncated to microseconds in the serializer, and Arrow
+        # raises an error if that truncation would lose precision (i.e., if a
+        # non-zero nanosecond component cannot be represented in microseconds),
+        # so nanosecond=0 is used here.
pdf = pd.DataFrame(
{
"naive": [datetime(2019, 1, 1, 0)],
"aware": [
Timestamp(
- year=2019, month=1, day=1, nanosecond=500, tz=timezone(timedelta(hours=-8))
+ year=2019, month=1, day=1, nanosecond=0, tz=timezone(timedelta(hours=-8))
)
],
}
diff --git a/python/pyspark/sql/tests/connect/test_connect_dataframe_property.py b/python/pyspark/sql/tests/connect/test_connect_dataframe_property.py
index 76007137bc7a6..d5f5f994fe124 100644
--- a/python/pyspark/sql/tests/connect/test_connect_dataframe_property.py
+++ b/python/pyspark/sql/tests/connect/test_connect_dataframe_property.py
@@ -72,6 +72,15 @@ def test_cached_property_is_copied(self):
df_columns.remove(col)
assert len(df.columns) == 4
+ cdf = self.connect.createDataFrame(data, schema)
+ cdf_schema = cdf.schema
+ assert len(cdf._cached_schema_serialized) > 0
+ assert cdf_schema.jsonValue() == cdf._cached_schema.jsonValue()
+ assert len(cdf_schema.fields) == 4
+ cdf_schema.fields.pop(0)
+ assert cdf.schema.jsonValue() == cdf._cached_schema.jsonValue()
+ assert len(cdf.schema.fields) == 4
+
def test_cached_schema_to(self):
rows = [Row(id=x, name=str(x)) for x in range(100)]
cdf = self.connect.createDataFrame(rows)
diff --git a/python/pyspark/sql/tests/connect/test_connect_function.py b/python/pyspark/sql/tests/connect/test_connect_function.py
index 20ce6b88e390a..b906f5c5cef44 100644
--- a/python/pyspark/sql/tests/connect/test_connect_function.py
+++ b/python/pyspark/sql/tests/connect/test_connect_function.py
@@ -551,8 +551,6 @@ def test_aggregation_functions(self):
(CF.approx_count_distinct, SF.approx_count_distinct),
(CF.approxCountDistinct, SF.approxCountDistinct),
(CF.avg, SF.avg),
- (CF.collect_list, SF.collect_list),
- (CF.collect_set, SF.collect_set),
(CF.listagg, SF.listagg),
(CF.listagg_distinct, SF.listagg_distinct),
(CF.string_agg, SF.string_agg),
@@ -589,6 +587,25 @@ def test_aggregation_functions(self):
check_exact=False,
)
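+        # collect_list/collect_set produce nondeterministically ordered arrays,
+        # so wrap them in sort_array before comparing the two backends.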
+ for cfunc, sfunc in [
+ (CF.collect_list, SF.collect_list),
+ (CF.collect_set, SF.collect_set),
+ ]:
+ self.assert_eq(
+ cdf.select(CF.sort_array(cfunc("b")), CF.sort_array(cfunc(cdf.c))).toPandas(),
+ sdf.select(SF.sort_array(sfunc("b")), SF.sort_array(sfunc(sdf.c))).toPandas(),
+ check_exact=False,
+ )
+ self.assert_eq(
+ cdf.groupBy("a")
+ .agg(CF.sort_array(cfunc("b")), CF.sort_array(cfunc(cdf.c)))
+ .toPandas(),
+ sdf.groupBy("a")
+ .agg(SF.sort_array(sfunc("b")), SF.sort_array(sfunc(sdf.c)))
+ .toPandas(),
+ check_exact=False,
+ )
+
for cfunc, sfunc in [
(CF.corr, SF.corr),
(CF.covar_pop, SF.covar_pop),
@@ -601,8 +618,8 @@ def test_aggregation_functions(self):
sdf.select(sfunc(sdf.b, "c")).toPandas(),
)
self.assert_eq(
- cdf.groupBy("a").agg(cfunc(cdf.b, "c")).toPandas(),
- sdf.groupBy("a").agg(sfunc(sdf.b, "c")).toPandas(),
+ cdf.groupBy("a").agg(cfunc(cdf.b, "c")).orderBy("a").toPandas(),
+ sdf.groupBy("a").agg(sfunc(sdf.b, "c")).orderBy("a").toPandas(),
)
# test grouping
@@ -628,13 +645,13 @@ def test_aggregation_functions(self):
check_exact=False,
)
self.assert_eq(
- cdf.groupBy("a").agg(CF.percentile_approx("b", 0.5)).toPandas(),
- sdf.groupBy("a").agg(SF.percentile_approx("b", 0.5)).toPandas(),
+ cdf.groupBy("a").agg(CF.percentile_approx("b", 0.5)).orderBy("a").toPandas(),
+ sdf.groupBy("a").agg(SF.percentile_approx("b", 0.5)).orderBy("a").toPandas(),
check_exact=False,
)
self.assert_eq(
- cdf.groupBy("a").agg(CF.percentile_approx(cdf.b, [0.1, 0.9])).toPandas(),
- sdf.groupBy("a").agg(SF.percentile_approx(sdf.b, [0.1, 0.9])).toPandas(),
+ cdf.groupBy("a").agg(CF.percentile_approx(cdf.b, [0.1, 0.9])).orderBy("a").toPandas(),
+ sdf.groupBy("a").agg(SF.percentile_approx(sdf.b, [0.1, 0.9])).orderBy("a").toPandas(),
check_exact=False,
)
@@ -652,9 +669,11 @@ def test_aggregation_functions(self):
self.assert_eq(
cdf.groupBy("a")
.agg(CF.count_distinct("b").alias("x"), CF.count_distinct(cdf.c).alias("y"))
+ .orderBy("a")
.toPandas(),
sdf.groupBy("a")
.agg(SF.count_distinct("b").alias("x"), SF.count_distinct(sdf.c).alias("y"))
+ .orderBy("a")
.toPandas(),
)
diff --git a/python/pyspark/sql/tests/connect/test_connect_plan.py b/python/pyspark/sql/tests/connect/test_connect_plan.py
index a03cd30c733fb..d25799f0c9f26 100644
--- a/python/pyspark/sql/tests/connect/test_connect_plan.py
+++ b/python/pyspark/sql/tests/connect/test_connect_plan.py
@@ -893,7 +893,7 @@ def test_float_nan_inf(self):
self.assertIsNotNone(inf_lit.to_plan(None))
def test_datetime_literal_types(self):
- """Test the different timestamp, date, and timedelta types."""
+ """Test the different timestamp, date, time, and timedelta types."""
datetime_lit = lit(datetime.datetime.now())
p = datetime_lit.to_plan(None)
@@ -908,6 +908,10 @@ def test_datetime_literal_types(self):
# (24 * 3600 + 2) * 1000000 + 3
self.assertEqual(86402000003, time_delta.to_plan(None).literal.day_time_interval)
+ time_lit = lit(datetime.time(23, 59, 59, 999999))
+ self.assertIsNotNone(time_lit.to_plan(None))
+ self.assertEqual(time_lit.to_plan(None).literal.time.nano, 86399999999000)
+
def test_list_to_literal(self):
"""Test conversion of lists to literals"""
empty_list = []
@@ -1024,6 +1028,7 @@ def test_literal_to_any_conversion(self):
decimal.Decimal(1.234567),
"sss",
datetime.date(2022, 12, 13),
+ datetime.time(12, 13, 14),
datetime.datetime.now(),
datetime.timedelta(1, 2, 3),
[1, 2, 3, 4, 5, 6],
diff --git a/python/pyspark/sql/tests/connect/test_connect_retry.py b/python/pyspark/sql/tests/connect/test_connect_retry.py
index f51e062479284..21796869e385d 100644
--- a/python/pyspark/sql/tests/connect/test_connect_retry.py
+++ b/python/pyspark/sql/tests/connect/test_connect_retry.py
@@ -18,7 +18,6 @@
import unittest
from collections import defaultdict
-from pyspark.errors import RetriesExceeded
from pyspark.testing.connectutils import (
should_test_connect,
connect_requirement_message,
@@ -88,7 +87,7 @@ def test_below_limit(self):
def test_exceed_retries(self):
# Exceed the retries.
- with self.assertRaises(RetriesExceeded):
+ with self.assertRaises(TestError):
for attempt in Retrying(TestPolicy(max_retries=2)):
with attempt:
self.stub(5, grpc.StatusCode.INTERNAL)
@@ -117,7 +116,7 @@ def test_specific_exception(self):
def test_specific_exception_exceed_retries(self):
# Exceed the retries.
policy = TestPolicySpecificError(max_retries=2, specific_code=grpc.StatusCode.UNAVAILABLE)
- with self.assertRaises(RetriesExceeded):
+ with self.assertRaises(TestError):
for attempt in Retrying(policy):
with attempt:
self.stub(5, grpc.StatusCode.UNAVAILABLE)
@@ -157,13 +156,13 @@ def test_multiple_policies_exceed(self):
policy1 = TestPolicySpecificError(max_retries=2, specific_code=grpc.StatusCode.INTERNAL)
policy2 = TestPolicySpecificError(max_retries=4, specific_code=grpc.StatusCode.INTERNAL)
- with self.assertRaises(RetriesExceeded):
+ with self.assertRaises(TestError):
for attempt in Retrying([policy1, policy2]):
with attempt:
self.stub(10, grpc.StatusCode.INTERNAL)
- self.assertEqual(self.call_wrap["attempts"], 7)
- self.assertEqual(self.call_wrap["raised"], 7)
+ self.assertEqual(self.call_wrap["attempts"], 3)
+ self.assertEqual(self.call_wrap["raised"], 3)
if __name__ == "__main__":
diff --git a/python/pyspark/sql/tests/connect/test_parity_udf_combinations.py b/python/pyspark/sql/tests/connect/test_parity_udf_combinations.py
new file mode 100644
index 0000000000000..bc63aa7aeb505
--- /dev/null
+++ b/python/pyspark/sql/tests/connect/test_parity_udf_combinations.py
@@ -0,0 +1,40 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import unittest
+
+from pyspark.sql.tests.test_udf_combinations import UDFCombinationsTestsMixin
+from pyspark.testing.connectutils import ReusedConnectTestCase
+
+
+class UDFCombinationsParityTests(UDFCombinationsTestsMixin, ReusedConnectTestCase):
+ @classmethod
+ def setUpClass(cls):
+ ReusedConnectTestCase.setUpClass()
+ cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.enabled", "false")
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.connect.test_parity_udf_combinations import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore[import]
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/pandas/helper/helper_pandas_transform_with_state.py b/python/pyspark/sql/tests/pandas/helper/helper_pandas_transform_with_state.py
index 8c35e0e3b486f..d258f693ccb88 100644
--- a/python/pyspark/sql/tests/pandas/helper/helper_pandas_transform_with_state.py
+++ b/python/pyspark/sql/tests/pandas/helper/helper_pandas_transform_with_state.py
@@ -31,6 +31,8 @@
LongType,
BooleanType,
FloatType,
+ ArrayType,
+ MapType,
)
from pyspark.testing.sqlutils import have_pandas
@@ -227,6 +229,14 @@ def row(self):
return RowMinEventTimeStatefulProcessor()
+class StatefulProcessorCompositeTypeFactory(StatefulProcessorFactory):
+ def pandas(self):
+ return PandasStatefulProcessorCompositeType()
+
+ def row(self):
+ return RowStatefulProcessorCompositeType()
+
+
# StatefulProcessor implementations
@@ -1615,3 +1625,200 @@ def handleInputRows(self, key, rows, timerValues) -> Iterator[Row]:
def close(self) -> None:
pass
+
+
+# A stateful processor that stores composite Python types inside Value, List and Map state variables
+class PandasStatefulProcessorCompositeType(StatefulProcessor):
+ TAGS = [["dummy1", "dummy2"], ["dummy3"]]
+ METADATA = [{"key": "env", "value": "prod"}, {"key": "region", "value": "us-west"}]
+ ATTRIBUTES_MAP = {"key1": [1], "key2": [10]}
+ CONFS_MAP = {"e1": {"e2": 5, "e3": 10}}
+
+ def init(self, handle: StatefulProcessorHandle) -> None:
+ obj_schema = StructType(
+ [
+ StructField("id", ArrayType(IntegerType())),
+ StructField("tags", ArrayType(ArrayType(StringType()))),
+ StructField(
+ "metadata",
+ ArrayType(
+ StructType(
+ [StructField("key", StringType()), StructField("value", StringType())]
+ )
+ ),
+ ),
+ ]
+ )
+
+ map_value_schema = StructType(
+ [
+ StructField("id", IntegerType(), True),
+ StructField("attributes", MapType(StringType(), ArrayType(IntegerType())), True),
+ StructField(
+ "confs", MapType(StringType(), MapType(StringType(), IntegerType()), True), True
+ ),
+ ]
+ )
+
+ self.obj_state = handle.getValueState("obj_state", obj_schema)
+ self.list_state = handle.getListState("list_state", obj_schema)
+ self.map_state = handle.getMapState("map_state", "name string", map_value_schema)
+
+ def _update_obj_state(self, total_temperature):
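+ # Verify the stored tags/metadata, add the batch total to each stored id (seed with [0] on first use),
+ # and write the composite tuple back to the value state.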
+ if self.obj_state.exists():
+ ids, tags, metadata = self.obj_state.get()
+ assert tags == self.TAGS, f"Tag mismatch: {tags}"
+ assert metadata == [Row(**m) for m in self.METADATA], f"Metadata mismatch: {metadata}"
+ ids = [int(x + total_temperature) for x in ids]
+ else:
+ ids = [0]
+ self.obj_state.update((ids, self.TAGS, self.METADATA))
+ return ids
+
+ def _update_list_state(self, total_temperature, initial_obj):
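+ # Append the batch total to each existing list entry's ids (or seed with initial_obj when empty),
+ # rewrite the list state, and return all ids flattened.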
+ existing_list = self.list_state.get()
+ updated_list = []
+ for ids, tags, metadata in existing_list:
+ ids.append(total_temperature)
+ updated_list.append((ids, tags, [row.asDict() for row in metadata]))
+ if not updated_list:
+ updated_list.append(initial_obj)
+ self.list_state.put(updated_list)
+ return [id_val for ids, _, _ in updated_list for id_val in ids]
+
+ def _update_map_state(self, key, total_temperature):
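+ # Initialize the entry for this key with the default maps on first sight; otherwise record the batch
+ # total under the key in both the attributes and nested confs maps, then return the updated maps.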
+ if not self.map_state.containsKey(key):
+ self.map_state.updateValue(key, (0, self.ATTRIBUTES_MAP, self.CONFS_MAP))
+ else:
+ id_val, attributes, confs = self.map_state.getValue(key)
+ attributes[key] = [total_temperature]
+ confs.setdefault("e1", {})[key] = total_temperature
+ self.map_state.updateValue(key, (id_val, attributes, confs))
+ return self.map_state.getValue(key)[1], self.map_state.getValue(key)[2]
+
+ def handleInputRows(self, key, rows, timerValues) -> Iterator[pd.DataFrame]:
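+ # Sum the batch temperatures, update the value/list/map state variables, and emit one summary row
+ # per key with the state contents serialized as strings/JSON.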
+ key = key[0]
+ total_temperature = sum(pdf["temperature"].astype(int).sum() for pdf in rows)
+
+ updated_ids = self._update_obj_state(total_temperature)
+ flattened_ids = self._update_list_state(
+ total_temperature, (updated_ids, self.TAGS, self.METADATA)
+ )
+ attributes_map, confs_map = self._update_map_state(key, total_temperature)
+
+ import json
+ import numpy as np
+
+ def np_int64_to_int(x):
+ if isinstance(x, np.int64):
+ return int(x)
+ return x
+
+ yield pd.DataFrame(
+ {
+ "id": [key],
+ "value_arr": [",".join(map(str, updated_ids))],
+ "list_state_arr": [",".join(map(str, flattened_ids))],
+ "map_state_arr": [
+ json.dumps(attributes_map, default=np_int64_to_int, sort_keys=True)
+ ],
+ "nested_map_state_arr": [
+ json.dumps(confs_map, default=np_int64_to_int, sort_keys=True)
+ ],
+ }
+ )
+
+ def close(self) -> None:
+ pass
+
+
+class RowStatefulProcessorCompositeType(StatefulProcessor):
+ TAGS = [["dummy1", "dummy2"], ["dummy3"]]
+ METADATA = [{"key": "env", "value": "prod"}, {"key": "region", "value": "us-west"}]
+ ATTRIBUTES_MAP = {"key1": [1], "key2": [10]}
+ CONFS_MAP = {"e1": {"e2": 5, "e3": 10}}
+
+ def init(self, handle: StatefulProcessorHandle) -> None:
+ obj_schema = StructType(
+ [
+ StructField("id", ArrayType(IntegerType())),
+ StructField("tags", ArrayType(ArrayType(StringType()))),
+ StructField(
+ "metadata",
+ ArrayType(
+ StructType(
+ [StructField("key", StringType()), StructField("value", StringType())]
+ )
+ ),
+ ),
+ ]
+ )
+
+ map_value_schema = StructType(
+ [
+ StructField("id", IntegerType(), True),
+ StructField("attributes", MapType(StringType(), ArrayType(IntegerType())), True),
+ StructField(
+ "confs", MapType(StringType(), MapType(StringType(), IntegerType()), True), True
+ ),
+ ]
+ )
+
+ self.obj_state = handle.getValueState("obj_state", obj_schema)
+ self.list_state = handle.getListState("list_state", obj_schema)
+ self.map_state = handle.getMapState("map_state", "name string", map_value_schema)
+
+ def _update_obj_state(self, total_temperature):
+ if self.obj_state.exists():
+ ids, tags, metadata = self.obj_state.get()
+ assert tags == self.TAGS, f"Tag mismatch: {tags}"
+ assert metadata == [Row(**m) for m in self.METADATA], f"Metadata mismatch: {metadata}"
+ ids = [int(x + total_temperature) for x in ids]
+ else:
+ ids = [0]
+ self.obj_state.update((ids, self.TAGS, self.METADATA))
+ return ids
+
+ def _update_list_state(self, total_temperature, initial_obj):
+ existing_list = self.list_state.get()
+ updated_list = []
+ for ids, tags, metadata in existing_list:
+ ids.append(total_temperature)
+ updated_list.append((ids, tags, [row.asDict() for row in metadata]))
+ if not updated_list:
+ updated_list.append(initial_obj)
+ self.list_state.put(updated_list)
+ return [id_val for ids, _, _ in updated_list for id_val in ids]
+
+ def _update_map_state(self, key, total_temperature):
+ if not self.map_state.containsKey(key):
+ self.map_state.updateValue(key, (0, self.ATTRIBUTES_MAP, self.CONFS_MAP))
+ else:
+ id_val, attributes, confs = self.map_state.getValue(key)
+ attributes[key] = [total_temperature]
+ confs.setdefault("e1", {})[key] = total_temperature
+ self.map_state.updateValue(key, (id_val, attributes, confs))
+ return self.map_state.getValue(key)[1], self.map_state.getValue(key)[2]
+
+ def handleInputRows(self, key, rows, timerValues) -> Iterator[Row]:
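+ # Same flow as the pandas variant above, but consumes input Rows and yields a single Row per key.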
+ key = key[0]
+ total_temperature = sum(int(row.temperature) for row in rows)
+
+ updated_ids = self._update_obj_state(total_temperature)
+ flattened_ids = self._update_list_state(
+ total_temperature, (updated_ids, self.TAGS, self.METADATA)
+ )
+ attributes_map, confs_map = self._update_map_state(key, total_temperature)
+
+ import json
+
+ yield Row(
+ id=key,
+ value_arr=",".join(map(str, updated_ids)),
+ list_state_arr=",".join(map(str, flattened_ids)),
+ map_state_arr=json.dumps(attributes_map, sort_keys=True),
+ nested_map_state_arr=json.dumps(confs_map, sort_keys=True),
+ )
+
+ def close(self) -> None:
+ pass
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_cogrouped_map.py b/python/pyspark/sql/tests/pandas/test_pandas_cogrouped_map.py
index 1f9532352679a..d23252abf6a92 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_cogrouped_map.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_cogrouped_map.py
@@ -262,7 +262,7 @@ def check_apply_in_pandas_returning_incompatible_type(self):
"`spark.sql.execution.pandas.convertToArrowArraySafely`."
)
self._test_merge_error(
- fn=lambda lft, rgt: pd.DataFrame({"id": [1], "k": ["2.0"]}),
+ fn=lambda lft, rgt: pd.DataFrame({"id": [1], "k": ["test_string"]}),
output_schema="id long, k double",
errorClass=PythonException,
error_message_regex=expected,
@@ -281,6 +281,54 @@ def check_apply_in_pandas_returning_incompatible_type(self):
error_message_regex=expected,
)
+ def test_cogroup_apply_int_to_decimal_coercion(self):
+ left = self.data1.limit(3)
+ right = self.data2.limit(3)
+
+ def int_to_decimal_merge(lft, rgt):
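+ # Return an integer decimal_result so the decimal(10,2) output schema exercises int-to-decimal coercion.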
+ return pd.DataFrame(
+ [
+ {
+ "id": 1,
+ "decimal_result": 98765,
+ "left_count": len(lft),
+ "right_count": len(rgt),
+ }
+ ]
+ )
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ result = (
+ left.groupby("id")
+ .cogroup(right.groupby("id"))
+ .applyInPandas(
+ int_to_decimal_merge,
+ "id long, decimal_result decimal(10,2), left_count long, right_count long",
+ )
+ .collect()
+ )
+ self.assertTrue(len(result) > 0)
+ for row in result:
+ self.assertEqual(row.decimal_result, 98765.00)
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": False}
+ ):
+ with self.assertRaisesRegex(
+ PythonException, "Exception thrown when converting pandas.Series"
+ ):
+ (
+ left.groupby("id")
+ .cogroup(right.groupby("id"))
+ .applyInPandas(
+ int_to_decimal_merge,
+ "id long, decimal_result decimal(10,2), left_count long, right_count long",
+ )
+ .collect()
+ )
+
def test_mixed_scalar_udfs_followed_by_cogrouby_apply(self):
df = self.spark.range(0, 10).toDF("v1")
df = df.withColumn("v2", udf(lambda x: x + 1, "int")(df["v1"])).withColumn(
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_grouped_map.py b/python/pyspark/sql/tests/pandas/test_pandas_grouped_map.py
index 4ef334549ef5a..b8f1afc5130f9 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_grouped_map.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_grouped_map.py
@@ -221,8 +221,10 @@ def check_register_grouped_map_udf(self):
exception=pe.exception,
errorClass="INVALID_UDF_EVAL_TYPE",
messageParameters={
- "eval_type": "SQL_BATCHED_UDF, SQL_ARROW_BATCHED_UDF, SQL_SCALAR_PANDAS_UDF, "
- "SQL_SCALAR_PANDAS_ITER_UDF or SQL_GROUPED_AGG_PANDAS_UDF"
+ "eval_type": "SQL_BATCHED_UDF, SQL_ARROW_BATCHED_UDF, "
+ "SQL_SCALAR_PANDAS_UDF, SQL_SCALAR_ARROW_UDF, "
+ "SQL_SCALAR_PANDAS_ITER_UDF, SQL_SCALAR_ARROW_ITER_UDF, "
+ "SQL_GROUPED_AGG_PANDAS_UDF or SQL_GROUPED_AGG_ARROW_UDF"
},
)
@@ -370,7 +372,7 @@ def check_apply_in_pandas_returning_incompatible_type(self):
)
with self.assertRaisesRegex(PythonException, expected + "\n"):
self._test_apply_in_pandas(
- lambda key, pdf: pd.DataFrame([key + (str(pdf.v.mean()),)]),
+ lambda key, pdf: pd.DataFrame([key + ("test_string",)]),
output_schema="id long, mean double",
)
@@ -386,6 +388,37 @@ def check_apply_in_pandas_returning_incompatible_type(self):
output_schema="id long, mean string",
)
+ def test_apply_in_pandas_int_to_decimal_coercion(self):
+ def int_to_decimal_func(key, pdf):
+ return pd.DataFrame([{"id": key[0], "decimal_result": 12345}])
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ result = (
+ self.data.groupby("id")
+ .applyInPandas(int_to_decimal_func, schema="id long, decimal_result decimal(10,2)")
+ .collect()
+ )
+
+ self.assertTrue(len(result) > 0)
+ for row in result:
+ self.assertEqual(row.decimal_result, 12345.00)
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": False}
+ ):
+ with self.assertRaisesRegex(
+ PythonException, "Exception thrown when converting pandas.Series"
+ ):
+ (
+ self.data.groupby("id")
+ .applyInPandas(
+ int_to_decimal_func, schema="id long, decimal_result decimal(10,2)"
+ )
+ .collect()
+ )
+
def test_datatype_string(self):
df = self.data
@@ -868,6 +901,51 @@ def _test_apply_in_pandas_returning_empty_dataframe_error(self, empty_df, error)
with self.assertRaisesRegex(PythonException, error):
self._test_apply_in_pandas_returning_empty_dataframe(empty_df)
+ def test_arrow_cast_enabled_numeric_to_decimal(self):
+ import numpy as np
+
+ columns = [
+ "int8",
+ "int16",
+ "int32",
+ "uint8",
+ "uint16",
+ "uint32",
+ "float64",
+ ]
+
+ pdf = pd.DataFrame({key: np.arange(1, 2).astype(key) for key in columns})
+ df = self.spark.range(2).repartition(1)
+
+ for column in columns:
+ with self.subTest(column=column):
+ v = pdf[column].iloc[:1]
+ schema_str = "id long, value decimal(10,0)"
+
+ @pandas_udf(schema_str, PandasUDFType.GROUPED_MAP)
+ def test(pdf):
+ return pdf.assign(**{"value": v})
+
+ row = df.groupby("id").apply(test).first()
+ res = row[1]
+ self.assertEqual(res, Decimal("1"))
+
+ def test_arrow_cast_enabled_str_to_numeric(self):
+ df = self.spark.range(2).repartition(1)
+
+ types = ["int", "long", "float", "double"]
+
+ for type_str in types:
+ with self.subTest(type=type_str):
+ schema_str = "id long, value " + type_str
+
+ @pandas_udf(schema_str, PandasUDFType.GROUPED_MAP)
+ def test(pdf):
+ return pdf.assign(value=pd.Series(["123"]))
+
+ row = df.groupby("id").apply(test).first()
+ self.assertEqual(row[1], 123)
+
class GroupedApplyInPandasTests(GroupedApplyInPandasTestsMixin, ReusedSQLTestCase):
pass
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_grouped_map_with_state.py b/python/pyspark/sql/tests/pandas/test_pandas_grouped_map_with_state.py
index e1b8d7c76d183..e4f307ebc96ae 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_grouped_map_with_state.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_grouped_map_with_state.py
@@ -23,6 +23,7 @@
import unittest
from typing import cast
+from decimal import Decimal
from pyspark.sql.streaming.state import GroupStateTimeout, GroupState
from pyspark.sql.types import (
@@ -31,6 +32,7 @@
StructType,
StructField,
Row,
+ DecimalType,
)
from pyspark.testing.sqlutils import (
ReusedSQLTestCase,
@@ -59,7 +61,12 @@ def conf(cls):
cfg.set("spark.sql.shuffle.partitions", "5")
return cfg
- def _test_apply_in_pandas_with_state_basic(self, func, check_results):
+ def _test_apply_in_pandas_with_state_basic(self, func, check_results, output_type=None):
+ if output_type is None:
+ output_type = StructType(
+ [StructField("key", StringType()), StructField("countAsString", StringType())]
+ )
+
input_path = tempfile.mkdtemp()
def prepare_test_resource():
@@ -75,9 +82,6 @@ def prepare_test_resource():
q.stop()
self.assertTrue(df.isStreaming)
- output_type = StructType(
- [StructField("key", StringType()), StructField("countAsString", StringType())]
- )
state_type = StructType([StructField("c", LongType())])
q = (
@@ -314,6 +318,26 @@ def assert_test():
finally:
q.stop()
+ def test_apply_in_pandas_with_state_int_to_decimal_coercion(self):
+ def func(key, pdf_iter, state):
+ assert isinstance(state, GroupState)
+ yield pd.DataFrame({"key": [key[0]], "decimal_sum": [1]})
+
+ def check_results(batch_df, _):
+ assert set(batch_df.sort("key").collect()) == {
+ Row(key="hello", decimal_sum=Decimal("1.00")),
+ Row(key="this", decimal_sum=Decimal("1.00")),
+ }, "Decimal coercion failed: " + str(batch_df.sort("key").collect())
+
+ output_type = StructType(
+ [StructField("key", StringType()), StructField("decimal_sum", DecimalType(10, 2))]
+ )
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ self._test_apply_in_pandas_with_state_basic(func, check_results, output_type)
+
class GroupedApplyInPandasWithStateTests(
GroupedApplyInPandasWithStateTestsMixin, ReusedSQLTestCase
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_map.py b/python/pyspark/sql/tests/pandas/test_pandas_map.py
index 7debe8035f611..b241b91e02a29 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_map.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_map.py
@@ -276,16 +276,17 @@ def test_dataframes_with_incompatible_types(self):
self.check_dataframes_with_incompatible_types()
def check_dataframes_with_incompatible_types(self):
- def func(iterator):
- for pdf in iterator:
- yield pdf.assign(id=pdf["id"].apply(str))
-
for safely in [True, False]:
with self.subTest(convertToArrowArraySafely=safely), self.sql_conf(
{"spark.sql.execution.pandas.convertToArrowArraySafely": safely}
):
# sometimes we see ValueErrors
with self.subTest(convert="string to double"):
+
+ def func(iterator):
+ for pdf in iterator:
+ yield pdf.assign(id="test_string")
+
expected = (
r"ValueError: Exception thrown when converting pandas.Series "
r"\(object\) with name 'id' to Arrow Array \(double\)."
@@ -304,18 +305,31 @@ def func(iterator):
.collect()
)
- # sometimes we see TypeErrors
- with self.subTest(convert="double to string"):
- with self.assertRaisesRegex(
- PythonException,
- r"TypeError: Exception thrown when converting pandas.Series "
- r"\(float64\) with name 'id' to Arrow Array \(string\).\n",
- ):
- (
- self.spark.range(10, numPartitions=3)
- .select(col("id").cast("double"))
- .mapInPandas(self.identity_dataframes_iter("id"), "id string")
- .collect()
+ with self.subTest(convert="float to int precision loss"):
+
+ def func(iterator):
+ for pdf in iterator:
+ yield pdf.assign(id=pdf["id"] + 0.1)
+
+ df = (
+ self.spark.range(10, numPartitions=3)
+ .select(col("id").cast("double"))
+ .mapInPandas(func, "id int")
+ )
+ if safely:
+ expected = (
+ r"ValueError: Exception thrown when converting pandas.Series "
+ r"\(float64\) with name 'id' to Arrow Array \(int32\)."
+ " It can be caused by overflows or other "
+ "unsafe conversions warned by Arrow. Arrow safe type check "
+ "can be disabled by using SQL config "
+ "`spark.sql.execution.pandas.convertToArrowArraySafely`."
+ )
+ with self.assertRaisesRegex(PythonException, expected + "\n"):
+ df.collect()
+ else:
+ self.assertEqual(
+ df.collect(), self.spark.range(10, numPartitions=3).collect()
)
def test_empty_iterator(self):
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_transform_with_state.py b/python/pyspark/sql/tests/pandas/test_pandas_transform_with_state.py
index 007ed5de2fbd7..d3bda545e1c99 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_transform_with_state.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_transform_with_state.py
@@ -35,6 +35,7 @@
Row,
IntegerType,
TimestampType,
+ DecimalType,
)
from pyspark.testing import assertDataFrameEqual
from pyspark.testing.sqlutils import (
@@ -68,6 +69,7 @@
ReorderedFieldsProcessorFactory,
UpcastProcessorFactory,
MinEventTimeStatefulProcessorFactory,
+ StatefulProcessorCompositeTypeFactory,
)
@@ -138,6 +140,12 @@ def _test_transform_with_state_basic(
timeMode="None",
checkpoint_path=None,
initial_state=None,
+ output_schema=StructType(
+ [
+ StructField("id", StringType(), True),
+ StructField("countAsString", StringType(), True),
+ ]
+ ),
):
input_path = tempfile.mkdtemp()
if checkpoint_path is None:
@@ -153,13 +161,6 @@ def _test_transform_with_state_basic(
q.stop()
self.assertTrue(df.isStreaming)
- output_schema = StructType(
- [
- StructField("id", StringType(), True),
- StructField("countAsString", StringType(), True),
- ]
- )
-
stateful_processor = self.get_processor(stateful_processor_factory)
if self.use_pandas():
tws_df = df.groupBy("id").transformWithStateInPandas(
@@ -194,6 +195,7 @@ def _test_transform_with_state_basic(
def test_transform_with_state_basic(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
@@ -209,6 +211,7 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_non_exist_value_state(self):
def check_results(batch_df, _):
+ batch_df.collect()
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="0"),
Row(id="1", countAsString="0"),
@@ -294,6 +297,7 @@ def test_transform_with_state_query_restarts(self):
def test_transform_with_state_list_state(self):
def check_results(batch_df, _):
+ batch_df.collect()
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
Row(id="1", countAsString="2"),
@@ -305,6 +309,7 @@ def check_results(batch_df, _):
def test_transform_with_state_list_state_large_list(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
expected_prev_elements = ""
expected_updated_elements = ",".join(map(lambda x: str(x), range(90)))
@@ -379,6 +384,7 @@ def check_results(batch_df, batch_id):
# test list state with ttl has the same behavior as list state when state doesn't expire.
def test_transform_with_state_list_state_large_ttl(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
Row(id="1", countAsString="2"),
@@ -390,6 +396,7 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_map_state(self):
def check_results(batch_df, _):
+ batch_df.collect()
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
Row(id="1", countAsString="2"),
@@ -400,6 +407,7 @@ def check_results(batch_df, _):
# test map state with ttl has the same behavior as map state when state doesn't expire.
def test_transform_with_state_map_state_large_ttl(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
Row(id="1", countAsString="2"),
@@ -413,6 +421,7 @@ def check_results(batch_df, batch_id):
# state doesn't expire.
def test_value_state_ttl_basic(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
@@ -432,6 +441,7 @@ def check_results(batch_df, batch_id):
@unittest.skip("test is flaky and it is only a timing issue, skipping until we can resolve")
def test_value_state_ttl_expiration(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assertDataFrameEqual(
batch_df,
@@ -580,6 +590,8 @@ def _test_transform_with_state_proc_timer(self, stateful_processor_factory, chec
def test_transform_with_state_proc_timer(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
+
# helper function to check expired timestamp is smaller than current processing time
def check_timestamp(batch_df):
expired_df = (
@@ -695,6 +707,7 @@ def prepare_batch3(input_path):
def test_transform_with_state_event_time(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
# watermark for late event = 0
# watermark for eviction = 0
@@ -726,6 +739,7 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_with_wmark_and_non_event_time(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
# watermark for late event = 0 and min event = 20
assert set(batch_df.sort("id").collect()) == {
@@ -823,6 +837,7 @@ def _test_transform_with_state_init_state(
def test_transform_with_state_init_state(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
# for key 0, initial state was processed and it was only processed once;
# for key 1, it did not appear in the initial state df;
@@ -846,6 +861,7 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_init_state_with_extra_transformation(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
# for key 0, initial state was processed and it was only processed once;
# for key 1, it did not appear in the initial state df;
@@ -924,6 +940,7 @@ def _test_transform_with_state_non_contiguous_grouping_cols(
def test_transform_with_state_non_contiguous_grouping_cols(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
assert set(batch_df.collect()) == {
Row(id1="0", id2="1", value=str(123 + 46)),
Row(id1="1", id2="2", value=str(146 + 346)),
@@ -935,6 +952,7 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_non_contiguous_grouping_cols_with_init_state(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
# initial state for key (0, 1) is processed
assert set(batch_df.collect()) == {
Row(id1="0", id2="1", value=str(789 + 123 + 46)),
@@ -1017,6 +1035,7 @@ def _test_transform_with_state_chaining_ops(
def test_transform_with_state_chaining_ops(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
import datetime
if batch_id == 0:
@@ -1052,6 +1071,7 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_init_state_with_timers(self):
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
# timers are registered and handled in the first batch for
# rows in initial state; For key=0 and key=3 which contains
@@ -1176,6 +1196,7 @@ def _test_transform_with_map_state_metadata(self, initial_state):
expected_operator_name = "transformWithStateInPySparkExec"
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
@@ -1292,6 +1313,7 @@ def test_transform_with_list_state_metadata(self):
checkpoint_path = tempfile.mktemp()
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
@@ -1371,6 +1393,7 @@ def test_transform_with_value_state_metadata(self):
checkpoint_path = tempfile.mktemp()
def check_results(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
@@ -1458,12 +1481,14 @@ def check_results(batch_df, batch_id):
def test_transform_with_state_restart_with_multiple_rows_init_state(self):
def check_results(batch_df, _):
+ batch_df.collect()
assert set(batch_df.sort("id").collect()) == {
Row(id="0", countAsString="2"),
Row(id="1", countAsString="2"),
}
def check_results_for_new_query(batch_df, batch_id):
+ batch_df.collect()
if batch_id == 0:
assert set(batch_df.sort("id").collect()) == {
Row(id="0", value=str(123 + 46)),
@@ -1513,6 +1538,63 @@ def dataframe_to_value_list(output_df):
initial_state=init_df,
)
+ def test_transform_with_state_in_pandas_composite_type(self):
+ def check_results(batch_df, batch_id):
+ if batch_id == 0:
+ map_val = {"key1": [1], "key2": [10]}
+ nested_map_val = {"e1": {"e2": 5, "e3": 10}}
+ assert set(batch_df.sort("id").collect()) == {
+ Row(
+ id="0",
+ value_arr="0",
+ list_state_arr="0",
+ map_state_arr=json.dumps(map_val, sort_keys=True),
+ nested_map_state_arr=json.dumps(nested_map_val, sort_keys=True),
+ ),
+ Row(
+ id="1",
+ value_arr="0",
+ list_state_arr="0",
+ map_state_arr=json.dumps(map_val, sort_keys=True),
+ nested_map_state_arr=json.dumps(nested_map_val, sort_keys=True),
+ ),
+ }, f"batch id: {batch_id}, real df is: {batch_df.collect()}"
+ else:
+ map_val_0 = {"key1": [1], "key2": [10], "0": [669]}
+ map_val_1 = {"key1": [1], "key2": [10], "1": [252]}
+ nested_map_val_0 = {"e1": {"e2": 5, "e3": 10, "0": 669}}
+ nested_map_val_1 = {"e1": {"e2": 5, "e3": 10, "1": 252}}
+ assert set(batch_df.sort("id").collect()) == {
+ Row(
+ id="0",
+ countAsString="669",
+ list_state_arr="0,669",
+ map_state_arr=json.dumps(map_val_0, sort_keys=True),
+ nested_map_state_arr=json.dumps(nested_map_val_0, sort_keys=True),
+ ),
+ Row(
+ id="1",
+ countAsString="252",
+ list_state_arr="0,252",
+ map_state_arr=json.dumps(map_val_1, sort_keys=True),
+ nested_map_state_arr=json.dumps(nested_map_val_1, sort_keys=True),
+ ),
+ }, f"batch id: {batch_id}, real df is: {batch_df.collect()}"
+
+ output_schema = StructType(
+ [
+ StructField("id", StringType(), True),
+ StructField("value_arr", StringType(), True),
+ StructField("list_state_arr", StringType(), True),
+ StructField("map_state_arr", StringType(), True),
+ StructField("nested_map_state_arr", StringType(), True),
+ ]
+ )
+
+ self._test_transform_with_state_basic(
+ StatefulProcessorCompositeTypeFactory(), check_results, output_schema=output_schema
+ )
+
# run the same test suites again but with single shuffle partition
def test_transform_with_state_with_timers_single_partition(self):
with self.sql_conf({"spark.sql.shuffle.partitions": "1"}):
@@ -1714,6 +1796,74 @@ def check_basic_state(batch_df, batch_id):
and "column family state must be nullable" in error_msg
)
+ def test_transform_with_state_int_to_decimal_coercion(self):
+ if not self.use_pandas():
+ return
+
+ class IntToDecimalProcessor(StatefulProcessor):
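+ # Counts rows per key in value state and emits an integer decimal_result to be coerced to decimal(10,2).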
+ def init(self, handle):
+ count_schema = StructType([StructField("value", IntegerType(), True)])
+ self.count_state = handle.getValueState("count", count_schema)
+
+ def handleInputRows(self, key, rows, timerValues):
+ if self.count_state.exists():
+ count = self.count_state.get()[0]
+ else:
+ count = 0
+ count += len(list(rows))
+ self.count_state.update((count,))
+
+ import pandas as pd
+
+ yield pd.DataFrame(
+ {"id": [key[0]], "decimal_result": [12345]} # Integer to be coerced to decimal
+ )
+
+ def close(self):
+ pass
+
+ data = [("1", "a"), ("1", "b"), ("2", "c")]
+ df = self.spark.createDataFrame(data, ["id", "value"])
+
+ output_schema = StructType(
+ [
+ StructField("id", StringType(), True),
+ StructField("decimal_result", DecimalType(10, 2), True),
+ ]
+ )
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ result = (
+ df.groupBy("id")
+ .transformWithStateInPandas(
+ statefulProcessor=IntToDecimalProcessor(),
+ outputStructType=output_schema,
+ outputMode="Update",
+ timeMode="None",
+ )
+ .collect()
+ )
+ self.assertTrue(len(result) > 0)
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": False}
+ ):
+ with self.assertRaisesRegex(
+ Exception, "Exception thrown when converting pandas.Series"
+ ):
+ (
+ df.groupBy("id")
+ .transformWithStateInPandas(
+ statefulProcessor=IntToDecimalProcessor(),
+ outputStructType=output_schema,
+ outputMode="Update",
+ timeMode="None",
+ )
+ .collect()
+ )
+
@unittest.skipIf(
not have_pyarrow or os.environ.get("PYTHON_GIL", "?") == "0",
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_udf.py b/python/pyspark/sql/tests/pandas/test_pandas_udf.py
index c2769bf882b6b..23fceb746114f 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_udf.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_udf.py
@@ -222,12 +222,20 @@ def foo(x):
with self.assertRaisesRegex(ValueError, "0-arg pandas_udfs.*not.*supported"):
pandas_udf(lambda: 1, LongType(), PandasUDFType.SCALAR)
+
with self.assertRaisesRegex(ValueError, "0-arg pandas_udfs.*not.*supported"):
@pandas_udf(LongType(), PandasUDFType.SCALAR)
def zero_with_type():
return 1
+ with self.assertRaisesRegex(ValueError, "0-arg pandas_udfs.*not.*supported"):
+
+ @pandas_udf(LongType(), PandasUDFType.SCALAR_ITER)
+ def zero_with_type():
+ yield 1
+ yield 2
+
with self.assertRaises(PySparkTypeError) as pe:
@pandas_udf(returnType=PandasUDFType.GROUPED_MAP)
@@ -343,6 +351,54 @@ def udf(column):
with self.sql_conf({"spark.sql.execution.pandas.convertToArrowArraySafely": False}):
df.withColumn("udf", udf("id")).collect()
+ def test_pandas_udf_int_to_decimal_coercion(self):
+ import pandas as pd
+ from decimal import Decimal
+
+ df = self.spark.range(0, 3)
+
+ @pandas_udf(returnType="decimal(10,2)")
+ def int_to_decimal_udf(column):
+ values = [123, 456, 789]
+ return pd.Series([values[int(val) % len(values)] for val in column])
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": True}
+ ):
+ result = df.withColumn("decimal_val", int_to_decimal_udf("id")).collect()
+ self.assertEqual(result[0]["decimal_val"], 123.00)
+ self.assertEqual(result[1]["decimal_val"], 456.00)
+ self.assertEqual(result[2]["decimal_val"], 789.00)
+
+ with self.sql_conf(
+ {"spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": False}
+ ):
+ self.assertRaisesRegex(
+ PythonException,
+ "Exception thrown when converting pandas.Series",
+ df.withColumn("decimal_val", int_to_decimal_udf("id")).collect,
+ )
+
+ @pandas_udf(returnType="decimal(25,1)")
+ def high_precision_udf(column):
+ values = [1, 2, 3]
+ return pd.Series([values[int(val) % len(values)] for val in column])
+
+ for intToDecimalCoercionEnabled in [True, False]:
+ # arrow_cast is enabled by default for SQL_SCALAR_PANDAS_UDF and
+ # SQL_SCALAR_PANDAS_ITER_UDF; Arrow can do this cast safely, so
+ # intToDecimalCoercionEnabled is not required for this case.
+ with self.sql_conf(
+ {
+ "spark.sql.execution.pythonUDF.pandas.intToDecimalCoercionEnabled": intToDecimalCoercionEnabled # noqa: E501
+ }
+ ):
+ result = df.withColumn("decimal_val", high_precision_udf("id")).collect()
+ self.assertEqual(len(result), 3)
+ self.assertEqual(result[0]["decimal_val"], Decimal("1.0"))
+ self.assertEqual(result[1]["decimal_val"], Decimal("2.0"))
+ self.assertEqual(result[2]["decimal_val"], Decimal("3.0"))
+
def test_pandas_udf_timestamp_ntz(self):
# SPARK-36626: Test TimestampNTZ in pandas UDF
@pandas_udf(returnType="timestamp_ntz")
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_udf_grouped_agg.py b/python/pyspark/sql/tests/pandas/test_pandas_udf_grouped_agg.py
index e22b8f9ccacc2..1059af59f4a84 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_udf_grouped_agg.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_udf_grouped_agg.py
@@ -718,6 +718,49 @@ def biased_sum(v, w=None):
aggregated, df.groupby("id").agg((sum(df.v) + sum(df.w)).alias("s"))
)
+ def test_arrow_cast_enabled_numeric_to_decimal(self):
+ import numpy as np
+ from decimal import Decimal
+
+ columns = [
+ "int8",
+ "int16",
+ "int32",
+ "uint8",
+ "uint16",
+ "uint32",
+ "float64",
+ ]
+
+ pdf = pd.DataFrame({key: np.arange(1, 2).astype(key) for key in columns})
+ df = self.spark.range(2).repartition(1)
+
+ for column in columns:
+ with self.subTest(column=column):
+
+ @pandas_udf("decimal(10,0)", PandasUDFType.GROUPED_AGG)
+ def test(series):
+ return pdf[column].iloc[0]
+
+ row = df.groupby("id").agg(test(df.id)).first()
+ res = row[1]
+ self.assertEqual(res, Decimal("1"))
+
+ def test_arrow_cast_enabled_str_to_numeric(self):
+ df = self.spark.range(2).repartition(1)
+
+ types = ["int", "long", "float", "double"]
+
+ for type_str in types:
+ with self.subTest(type=type_str):
+
+ @pandas_udf(type_str, PandasUDFType.GROUPED_AGG)
+ def test(series):
+ return 123
+
+ row = df.groupby("id").agg(test(df.id)).first()
+ self.assertEqual(row[1], 123)
+
class GroupedAggPandasUDFTests(GroupedAggPandasUDFTestsMixin, ReusedSQLTestCase):
pass
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_udf_scalar.py b/python/pyspark/sql/tests/pandas/test_pandas_udf_scalar.py
index 0128ae4840703..e614d9039b61a 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_udf_scalar.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_udf_scalar.py
@@ -517,7 +517,10 @@ def test_vectorized_udf_struct_complex(self):
def _scalar_f(id):
return pd.DataFrame(
- {"ts": id.apply(lambda i: pd.Timestamp(i)), "arr": id.apply(lambda i: [i, i + 1])}
+ {
+ "ts": id.apply(lambda i: pd.Timestamp(i, unit="s")),
+ "arr": id.apply(lambda i: [i, i + 1]),
+ }
)
scalar_f = pandas_udf(_scalar_f, returnType=return_type)
@@ -532,7 +535,7 @@ def iter_f(it):
for i, row in enumerate(actual):
id, f = row
self.assertEqual(i, id)
- self.assertEqual(pd.Timestamp(i).to_pydatetime(), f[0])
+ self.assertEqual(pd.Timestamp(i, unit="s").to_pydatetime(), f[0])
self.assertListEqual([i, i + 1], f[1])
def test_vectorized_udf_struct_empty(self):
@@ -1872,6 +1875,36 @@ def test_udf(a, b=0):
with self.subTest(with_b=True, query_no=i):
assertDataFrameEqual(df, [Row(0), Row(101)])
+ def test_arrow_cast_enabled_numeric_to_decimal(self):
+ import numpy as np
+
+ columns = [
+ "int8",
+ "int16",
+ "int32",
+ "uint8",
+ "uint16",
+ "uint32",
+ "float64",
+ ]
+
+ pdf = pd.DataFrame({key: np.arange(1, 2).astype(key) for key in columns})
+ df = self.spark.range(2).repartition(1)
+
+ t = DecimalType(10, 0)
+ for column in columns:
+ with self.subTest(column=column):
+ v = pdf[column].iloc[:1]
+ row = df.select(pandas_udf(lambda _: v, t)(df.id)).first()
+ assert (row[0] == v).all()
+
+ def test_arrow_cast_enabled_str_to_numeric(self):
+ df = self.spark.range(2).repartition(1)
+ for t in [IntegerType(), LongType(), FloatType(), DoubleType()]:
+ with self.subTest(type=t):
+ row = df.select(pandas_udf(lambda _: pd.Series(["123"]), t)(df.id)).first()
+ assert row[0] == 123
+
class ScalarPandasUDFTests(ScalarPandasUDFTestsMixin, ReusedSQLTestCase):
@classmethod
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_udf_typehints.py b/python/pyspark/sql/tests/pandas/test_pandas_udf_typehints.py
index 7a0fccc225725..bb00f8f5b69b7 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_udf_typehints.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_udf_typehints.py
@@ -377,6 +377,19 @@ def func(col: "Union[pd.Series, pd.DataFrame]", *, col2: "pd.DataFrame") -> "pd.
infer_eval_type(signature(func), get_type_hints(func)), PandasUDFType.SCALAR
)
+ @unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+ def test_negative_with_arrow_udf(self):
+ import pyarrow as pa
+
+ with self.assertRaisesRegex(
+ Exception,
+ "Unsupported signature:.*pyarrow.lib.Array.",
+ ):
+
+ @pandas_udf("long")
+ def multiply_arrow(a: pa.Array, b: pa.Array) -> pa.Array:
+ return pa.compute.multiply(a, b)
+
if __name__ == "__main__":
from pyspark.sql.tests.pandas.test_pandas_udf_typehints import * # noqa: #401
diff --git a/python/pyspark/sql/tests/pandas/test_pandas_udf_window.py b/python/pyspark/sql/tests/pandas/test_pandas_udf_window.py
index 9b3673d80d224..2f534b811b345 100644
--- a/python/pyspark/sql/tests/pandas/test_pandas_udf_window.py
+++ b/python/pyspark/sql/tests/pandas/test_pandas_udf_window.py
@@ -17,6 +17,7 @@
import unittest
from typing import cast
+from decimal import Decimal
from pyspark.errors import AnalysisException, PythonException
from pyspark.sql.functions import (
@@ -33,6 +34,13 @@
PandasUDFType,
)
from pyspark.sql.window import Window
+from pyspark.sql.types import (
+ DecimalType,
+ IntegerType,
+ LongType,
+ FloatType,
+ DoubleType,
+)
from pyspark.testing.sqlutils import (
ReusedSQLTestCase,
have_pandas,
@@ -563,6 +571,43 @@ def weighted_mean(**kwargs):
)
).show()
+ def test_arrow_cast_numeric_to_decimal(self):
+ import numpy as np
+ import pandas as pd
+
+ columns = [
+ "int8",
+ "int16",
+ "int32",
+ "uint8",
+ "uint16",
+ "uint32",
+ "float64",
+ ]
+
+ pdf = pd.DataFrame({key: np.arange(1, 2).astype(key) for key in columns})
+ df = self.data
+ w = self.unbounded_window
+
+ t = DecimalType(10, 0)
+ for column in columns:
+ with self.subTest(column=column):
+ value = pdf[column].iloc[0]
+ mean_udf = pandas_udf(lambda v: value, t, PandasUDFType.GROUPED_AGG)
+ result = df.select(mean_udf(df["v"]).over(w)).first()[0]
+ assert result == Decimal("1.0")
+ assert type(result) == Decimal
+
+ def test_arrow_cast_str_to_numeric(self):
+ df = self.data
+ w = self.unbounded_window
+
+ for t in [IntegerType(), LongType(), FloatType(), DoubleType()]:
+ with self.subTest(type=t):
+ mean_udf = pandas_udf(lambda v: "123", t, PandasUDFType.GROUPED_AGG)
+ result = df.select(mean_udf(df["v"]).over(w)).first()[0]
+ assert result == 123
+
class WindowPandasUDFTests(WindowPandasUDFTestsMixin, ReusedSQLTestCase):
pass
diff --git a/python/pyspark/sql/tests/streaming/test_streaming_foreach_batch.py b/python/pyspark/sql/tests/streaming/test_streaming_foreach_batch.py
index 9db66aa252ee6..380f089d6a552 100644
--- a/python/pyspark/sql/tests/streaming/test_streaming_foreach_batch.py
+++ b/python/pyspark/sql/tests/streaming/test_streaming_foreach_batch.py
@@ -29,18 +29,18 @@ def test_streaming_foreach_batch(self):
q = None
def collectBatch(batch_df, batch_id):
- batch_df.write.format("parquet").saveAsTable("test_table")
+ batch_df.write.format("parquet").saveAsTable("test_table1")
try:
df = self.spark.readStream.format("text").load("python/test_support/sql/streaming")
q = df.writeStream.foreachBatch(collectBatch).start()
q.processAllAvailable()
- collected = self.spark.sql("select * from test_table").collect()
+ collected = self.spark.sql("select * from test_table1").collect()
self.assertTrue(len(collected), 2)
finally:
if q:
q.stop()
- self.spark.sql("DROP TABLE IF EXISTS test_table")
+ self.spark.sql("DROP TABLE IF EXISTS test_table1")
def test_streaming_foreach_batch_tempview(self):
q = None
@@ -52,18 +52,18 @@ def collectBatch(batch_df, batch_id):
# streaming query
assert len(batch_df.sparkSession.sql("SELECT * FROM updates").collect()) == 2
# Write a table to verify on the repl/client side.
- batch_df.write.format("parquet").saveAsTable("test_table")
+ batch_df.write.format("parquet").saveAsTable("test_table2")
try:
df = self.spark.readStream.format("text").load("python/test_support/sql/streaming")
q = df.writeStream.foreachBatch(collectBatch).start()
q.processAllAvailable()
- collected = self.spark.sql("SELECT * FROM test_table").collect()
+ collected = self.spark.sql("SELECT * FROM test_table2").collect()
self.assertTrue(len(collected[0]), 2)
finally:
if q:
q.stop()
- self.spark.sql("DROP TABLE IF EXISTS test_table")
+ self.spark.sql("DROP TABLE IF EXISTS test_table2")
def test_streaming_foreach_batch_propagates_python_errors(self):
from pyspark.errors import StreamingQueryException
@@ -204,6 +204,27 @@ def func(df: DataFrame, batch_id: int):
df = self.spark.read.format("text").load("python/test_support/sql/streaming")
self.assertEqual(sorted(df.collect()), sorted(actual.collect()))
+ def test_streaming_foreach_batch_external_column(self):
+ from pyspark.sql import functions as sf
+
+ table_name = "testTable_foreach_batch_external_column"
+ with self.table(table_name):
+ # Define 'col' outside of `func` below so that it has to be serialized.
+ col = sf.col("value")
+
+ def func(df: DataFrame, batch_id: int):
+ result_df = df.select(col.alias("result"))
+ result_df.write.mode("append").saveAsTable(table_name)
+
+ df = self.spark.readStream.format("text").load("python/test_support/sql/streaming")
+ q = df.writeStream.foreachBatch(func).start()
+ q.processAllAvailable()
+ q.stop()
+
+ collected = self.spark.sql("select * from " + table_name).collect()
+ results = [row["result"] for row in collected]
+ self.assertEqual(sorted(results), ["hello", "this"])
+
class StreamingTestsForeachBatch(StreamingTestsForeachBatchMixin, ReusedSQLTestCase):
pass
diff --git a/python/pyspark/sql/tests/streaming/test_streaming_listener.py b/python/pyspark/sql/tests/streaming/test_streaming_listener.py
index 934b1463a15cd..bb485dae6bdc2 100644
--- a/python/pyspark/sql/tests/streaming/test_streaming_listener.py
+++ b/python/pyspark/sql/tests/streaming/test_streaming_listener.py
@@ -400,9 +400,17 @@ def verify(test_listener):
# Check query terminated with exception
from pyspark.sql.functions import col, udf
+ start_event = None
+ progress_event = None
+ terminated_event = None
bad_udf = udf(lambda x: 1 / 0)
q = df.select(bad_udf(col("value"))).writeStream.format("noop").start()
- time.sleep(5)
+ wait_count = 0
+ while terminated_event is None:
+ time.sleep(0.5)
+ wait_count = wait_count + 1
+ if wait_count > 100:
+ self.fail("Not getting terminated event after 50 seconds")
q.stop()
self.spark.sparkContext._jsc.sc().listenerBus().waitUntilEmpty()
self.check_terminated_event(terminated_event, "ZeroDivisionError")
diff --git a/python/pyspark/sql/tests/test_collection.py b/python/pyspark/sql/tests/test_collection.py
index f59f4dc7b465a..5c923e0e7558e 100644
--- a/python/pyspark/sql/tests/test_collection.py
+++ b/python/pyspark/sql/tests/test_collection.py
@@ -15,9 +15,11 @@
# limitations under the License.
#
+import datetime
import unittest
from pyspark.sql.types import (
+ Row,
ArrayType,
StringType,
IntegerType,
@@ -363,6 +365,49 @@ def check_to_local_iterator_not_fully_consumed(self):
break
self.assertEqual(df.take(8), result)
+ def test_collect_time(self):
+ import pandas as pd
+
+ query = """
+ SELECT * FROM VALUES
+ (TIME '12:34:56', 'a'), (TIME '22:56:01', 'b'), (NULL, 'c')
+ AS tab(t, i)
+ """
+
+ df = self.spark.sql(query)
+
+ rows = df.collect()
+ self.assertEqual(
+ rows,
+ [
+ Row(t=datetime.time(12, 34, 56), i="a"),
+ Row(t=datetime.time(22, 56, 1), i="b"),
+ Row(t=None, i="c"),
+ ],
+ )
+
+ pdf = df.toPandas()
+ self.assertTrue(
+ pdf.equals(
+ pd.DataFrame(
+ {
+ "t": [datetime.time(12, 34, 56), datetime.time(22, 56, 1), None],
+ "i": ["a", "b", "c"],
+ }
+ )
+ )
+ )
+
+ tbl = df.toArrow()
+ self.assertEqual(
+ [t.as_py() for t in tbl.column("t")],
+ [datetime.time(12, 34, 56), datetime.time(22, 56, 1), None],
+ )
+ self.assertEqual(
+ [i.as_py() for i in tbl.column("i")],
+ ["a", "b", "c"],
+ )
+
class DataFrameCollectionTests(
DataFrameCollectionTestsMixin,
diff --git a/python/pyspark/sql/tests/test_column.py b/python/pyspark/sql/tests/test_column.py
index 5f1991973d27d..e2ebfd3c092c4 100644
--- a/python/pyspark/sql/tests/test_column.py
+++ b/python/pyspark/sql/tests/test_column.py
@@ -133,8 +133,8 @@ def test_access_column(self):
self.assertTrue(isinstance(df["key"], Column))
self.assertTrue(isinstance(df[0], Column))
self.assertRaises(IndexError, lambda: df[2])
- self.assertRaises(AnalysisException, lambda: df["bad_key"])
self.assertRaises(TypeError, lambda: df[{}])
+ self.assertRaises(AnalysisException, lambda: df.select(df["bad_key"]).schema)
def test_column_name_with_non_ascii(self):
columnName = "数量"
@@ -361,6 +361,9 @@ def test_lit_time_representation(self):
ts = datetime.datetime(2021, 3, 4, 12, 34, 56, 1234)
self.assertEqual(str(sf.lit(ts)), "Column<'2021-03-04 12:34:56.001234'>")
+ ts = datetime.time(12, 34, 56, 1234)
+ self.assertEqual(str(sf.lit(ts)), "Column<'12:34:56.001234'>")
+
@unittest.skipIf(not have_pandas, pandas_requirement_message)
def test_lit_delta_representation(self):
for delta in [
diff --git a/python/pyspark/sql/tests/test_conversion.py b/python/pyspark/sql/tests/test_conversion.py
new file mode 100644
index 0000000000000..2b18fe8d04d7a
--- /dev/null
+++ b/python/pyspark/sql/tests/test_conversion.py
@@ -0,0 +1,122 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+import unittest
+
+from pyspark.sql.conversion import ArrowTableToRowsConversion, LocalDataToArrowConversion
+from pyspark.sql.types import (
+ ArrayType,
+ BinaryType,
+ IntegerType,
+ MapType,
+ Row,
+ StringType,
+ StructType,
+)
+from pyspark.testing.objects import ExamplePoint, ExamplePointUDT
+from pyspark.testing.utils import have_pyarrow, pyarrow_requirement_message
+
+
+@unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+class ConversionTests(unittest.TestCase):
+ def test_conversion(self):
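+ # Round-trip local data -> Arrow table -> Rows, covering nullable, binary, nested and UDT columns.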
+ data = [
+ (
+ i if i % 2 == 0 else None,
+ str(i),
+ i,
+ str(i).encode(),
+ [j if j % 2 == 0 else None for j in range(i)],
+ list(range(i)),
+ [str(j).encode() for j in range(i)],
+ {str(j): j if j % 2 == 0 else None for j in range(i)},
+ {str(j): j for j in range(i)},
+ {str(j): str(j).encode() for j in range(i)},
+ (i if i % 2 == 0 else None, str(i), i, str(i).encode()),
+ {"i": i if i % 2 == 0 else None, "s": str(i), "ii": i, "b": str(i).encode()},
+ ExamplePoint(float(i), float(i)),
+ )
+ for i in range(5)
+ ]
+ schema = (
+ StructType()
+ .add("i", IntegerType())
+ .add("s", StringType())
+ .add("ii", IntegerType(), nullable=False)
+ .add("b", BinaryType())
+ .add("arr_i", ArrayType(IntegerType()))
+ .add("arr_ii", ArrayType(IntegerType(), containsNull=False))
+ .add("arr_b", ArrayType(BinaryType()))
+ .add("map_i", MapType(StringType(), IntegerType()))
+ .add("map_ii", MapType(StringType(), IntegerType(), valueContainsNull=False))
+ .add("map_b", MapType(StringType(), BinaryType()))
+ .add(
+ "struct_t",
+ StructType()
+ .add("i", IntegerType())
+ .add("s", StringType())
+ .add("ii", IntegerType(), nullable=False)
+ .add("b", BinaryType()),
+ )
+ .add(
+ "struct_d",
+ StructType()
+ .add("i", IntegerType())
+ .add("s", StringType())
+ .add("ii", IntegerType(), nullable=False)
+ .add("b", BinaryType()),
+ )
+ .add("udt", ExamplePointUDT())
+ )
+
+ tbl = LocalDataToArrowConversion.convert(data, schema, use_large_var_types=False)
+ actual = ArrowTableToRowsConversion.convert(tbl, schema)
+
+ for a, e in zip(
+ actual,
+ [
+ Row(
+ i=i if i % 2 == 0 else None,
+ s=str(i),
+ ii=i,
+ b=str(i).encode(),
+ arr_i=[j if j % 2 == 0 else None for j in range(i)],
+ arr_ii=list(range(i)),
+ arr_b=[str(j).encode() for j in range(i)],
+ map_i={str(j): j if j % 2 == 0 else None for j in range(i)},
+ map_ii={str(j): j for j in range(i)},
+ map_b={str(j): str(j).encode() for j in range(i)},
+ struct_t=Row(i=i if i % 2 == 0 else None, s=str(i), ii=i, b=str(i).encode()),
+ struct_d=Row(i=i if i % 2 == 0 else None, s=str(i), ii=i, b=str(i).encode()),
+ udt=ExamplePoint(float(i), float(i)),
+ )
+ for i in range(5)
+ ],
+ ):
+ with self.subTest(expected=e):
+ self.assertEqual(a, e)
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.test_conversion import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/test_creation.py b/python/pyspark/sql/tests/test_creation.py
index c6917aa234b41..fb78b4c146326 100644
--- a/python/pyspark/sql/tests/test_creation.py
+++ b/python/pyspark/sql/tests/test_creation.py
@@ -24,7 +24,12 @@
from pyspark.sql import Row
import pyspark.sql.functions as F
from pyspark.sql.types import (
+ DecimalType,
+ StructType,
+ StructField,
+ StringType,
DateType,
+ TimeType,
TimestampType,
TimestampNTZType,
)
@@ -32,6 +37,7 @@
PySparkTypeError,
PySparkValueError,
)
+from pyspark.testing import assertDataFrameEqual
from pyspark.testing.sqlutils import (
ReusedSQLTestCase,
have_pandas,
@@ -42,6 +48,21 @@
class DataFrameCreationTestsMixin:
+ def test_create_str_from_dict(self):
+ data = [
+ {"broker": {"teamId": 3398, "contactEmail": "abc.xyz@123.ca"}},
+ ]
+
+ for schema in [
+ StructType([StructField("broker", StringType())]),
+ "broker: string",
+ ]:
+ df = self.spark.createDataFrame(data, schema=schema)
+ self.assertEqual(
+ df.first().broker,
+ """{'teamId': 3398, 'contactEmail': 'abc.xyz@123.ca'}""",
+ )
+
def test_create_dataframe_from_array_of_long(self):
import array
@@ -49,6 +70,20 @@ def test_create_dataframe_from_array_of_long(self):
df = self.spark.createDataFrame(data)
self.assertEqual(df.first(), Row(longarray=[-9223372036854775808, 0, 9223372036854775807]))
+ def test_create_dataframe_from_datetime_time(self):
+ import datetime
+
+ df = self.spark.createDataFrame(
+ [
+ (datetime.time(1, 2, 3),),
+ (datetime.time(4, 5, 6),),
+ (datetime.time(7, 8, 9),),
+ ],
+ ["t"],
+ )
+ self.assertIsInstance(df.schema["t"].dataType, TimeType)
+ self.assertEqual(df.count(), 3)
+
@unittest.skipIf(not have_pandas, pandas_requirement_message) # type: ignore
def test_create_dataframe_from_pandas_with_timestamp(self):
import pandas as pd
@@ -126,6 +161,12 @@ def test_create_nan_decimal_dataframe(self):
[Row(value=None)],
)
+ def test_check_decimal_nan(self):
+ data = [Row(dec=Decimal("NaN"))]
+ schema = StructType([StructField("dec", DecimalType(), False)])
+ with self.assertRaises(PySparkValueError):
+ self.spark.createDataFrame(data=data, schema=schema)
+
def test_invalid_argument_create_dataframe(self):
with self.assertRaises(PySparkTypeError) as pe:
self.spark.createDataFrame([(1, 2)], schema=123)
@@ -210,6 +251,13 @@ def test_schema_inference_from_pandas_with_dict(self):
[Row(str_col="second", dict_col={"first": 0.7, "second": 0.3}, test=0.3)],
)
+ def test_empty_schema(self):
+ schema = StructType()
+ for data in [[], [Row()]]:
+ with self.subTest(data=data):
+ sdf = self.spark.createDataFrame(data, schema)
+ assertDataFrameEqual(sdf, data)
+
class DataFrameCreationTests(
DataFrameCreationTestsMixin,
diff --git a/python/pyspark/sql/tests/test_dataframe.py b/python/pyspark/sql/tests/test_dataframe.py
index 890ae56ffa529..75a553b62838e 100644
--- a/python/pyspark/sql/tests/test_dataframe.py
+++ b/python/pyspark/sql/tests/test_dataframe.py
@@ -26,7 +26,18 @@
from contextlib import redirect_stdout
from pyspark.sql import Row, functions, DataFrame
-from pyspark.sql.functions import col, lit, count, struct, date_format, to_date, array, explode
+from pyspark.sql.functions import (
+ col,
+ lit,
+ count,
+ struct,
+ date_format,
+ to_date,
+ array,
+ explode,
+ when,
+ concat,
+)
from pyspark.sql.types import (
StringType,
IntegerType,
@@ -189,6 +200,54 @@ def test_drop(self):
self.assertEqual(df.drop(col("name"), col("age")).columns, ["active"])
self.assertEqual(df.drop(col("name"), col("age"), col("random")).columns, ["active"])
+ def test_drop_notexistent_col(self):
+ df1 = self.spark.createDataFrame(
+ [("a", "b", "c")],
+ schema="colA string, colB string, colC string",
+ )
+ df2 = self.spark.createDataFrame(
+ [("c", "d", "e")],
+ schema="colC string, colD string, colE string",
+ )
+ df3 = df1.join(df2, df1["colC"] == df2["colC"]).withColumn(
+ "colB",
+ when(df1["colB"] == "b", concat(df1["colB"].cast("string"), lit("x"))).otherwise(
+ df1["colB"]
+ ),
+ )
+ df4 = df3.drop(df1["colB"])
+
+ self.assertEqual(df4.columns, ["colA", "colB", "colC", "colC", "colD", "colE"])
+ self.assertEqual(df4.count(), 1)
+
+ def test_drop_col_from_different_dataframe(self):
+ df1 = self.spark.range(10)
+ df2 = df1.withColumn("v0", lit(0))
+
+ # drop df2["id"] from df2
+ self.assertEqual(df2.drop(df2["id"]).columns, ["v0"])
+
+ # drop df1["id"] from df2, which is semantically equal to df2["id"]
+ # note that df1.drop(df2["id"]) works in Classic, but not in Connect
+ self.assertEqual(df2.drop(df1["id"]).columns, ["v0"])
+
+ df3 = df2.select("*", lit(1).alias("v1"))
+
+ # drop df3["id"] from df3
+ self.assertEqual(df3.drop(df3["id"]).columns, ["v0", "v1"])
+
+ # drop df2["id"] from df3, which is semantically equal to df3["id"]
+ self.assertEqual(df3.drop(df2["id"]).columns, ["v0", "v1"])
+
+ # drop df1["id"] from df3, which is semantically equal to df3["id"]
+ self.assertEqual(df3.drop(df1["id"]).columns, ["v0", "v1"])
+
+ # drop df3["v0"] from df3
+ self.assertEqual(df3.drop(df3["v0"]).columns, ["id", "v1"])
+
+ # drop df2["v0"] from df3, which is semantically equal to df3["v0"]
+ self.assertEqual(df3.drop(df2["v0"]).columns, ["id", "v1"])
+
def test_drop_join(self):
left_df = self.spark.createDataFrame(
[(1, "a"), (2, "b"), (3, "c")],
diff --git a/python/pyspark/sql/tests/test_functions.py b/python/pyspark/sql/tests/test_functions.py
index e2b3e33756ba3..2fde3edc2486c 100644
--- a/python/pyspark/sql/tests/test_functions.py
+++ b/python/pyspark/sql/tests/test_functions.py
@@ -81,7 +81,10 @@ def test_function_parity(self):
missing_in_py = jvm_fn_set.difference(py_fn_set)
# Functions that we expect to be missing in python until they are added to pyspark
- expected_missing_in_py = set()
+ expected_missing_in_py = set(
+ # TODO(SPARK-53108): Implement the time_diff function in Python
+ ["time_diff"]
+ )
self.assertEqual(
expected_missing_in_py, missing_in_py, "Missing functions in pyspark not as expected"
@@ -400,6 +403,19 @@ def test_rand_functions(self):
rndn2 = df.select("key", F.randn(0)).collect()
self.assertEqual(sorted(rndn1), sorted(rndn2))
+ def test_time_trunc(self):
+ # SPARK-53110: test the time_trunc function.
+ df = self.spark.range(1).select(
+ F.lit("minute").alias("unit"), F.lit(datetime.time(1, 2, 3)).alias("time")
+ )
+ result = datetime.time(1, 2, 0)
+ row_from_col = df.select(F.time_trunc(df.unit, df.time)).first()
+ self.assertIsInstance(row_from_col[0], datetime.time)
+ self.assertEqual(row_from_col[0], result)
+ row_from_name = df.select(F.time_trunc("unit", "time")).first()
+ self.assertIsInstance(row_from_name[0], datetime.time)
+ self.assertEqual(row_from_name[0], result)
+
def test_try_parse_url(self):
df = self.spark.createDataFrame(
[("https://spark.apache.org/path?query=1", "QUERY", "query")],
@@ -574,6 +590,30 @@ def test_dayname(self):
row = df.select(F.dayname(df.date)).first()
self.assertEqual(row[0], "Mon")
+ def test_hour(self):
+ # SPARK-52892: test the hour function with time.
+ df = self.spark.range(1).select(F.lit(datetime.time(12, 34, 56)).alias("time"))
+ row_from_col = df.select(F.hour(df.time)).first()
+ self.assertEqual(row_from_col[0], 12)
+ row_from_name = df.select(F.hour("time")).first()
+ self.assertEqual(row_from_name[0], 12)
+
+ def test_minute(self):
+ # SPARK-52893: test the minute function with time.
+ df = self.spark.range(1).select(F.lit(datetime.time(12, 34, 56)).alias("time"))
+ row_from_col = df.select(F.minute(df.time)).first()
+ self.assertEqual(row_from_col[0], 34)
+ row_from_name = df.select(F.minute("time")).first()
+ self.assertEqual(row_from_name[0], 34)
+
+ def test_second(self):
+ # SPARK-52894: test the second function with time.
+ df = self.spark.range(1).select(F.lit(datetime.time(12, 34, 56)).alias("time"))
+ row_from_col = df.select(F.second(df.time)).first()
+ self.assertEqual(row_from_col[0], 56)
+ row_from_name = df.select(F.second("time")).first()
+ self.assertEqual(row_from_name[0], 56)
+
# Test added for SPARK-37738; change Python API to accept both col & int as input
def test_date_add_function(self):
dt = datetime.date(2021, 12, 27)
@@ -628,6 +668,17 @@ def test_add_months_function(self):
)
)
+ def test_make_time(self):
+ # SPARK-52888: test the make_time function.
+ df = self.spark.createDataFrame([(1, 2, 3)], ["hour", "minute", "second"])
+ result = datetime.time(1, 2, 3)
+ row_from_col = df.select(F.make_time(df.hour, df.minute, df.second)).first()
+ self.assertIsInstance(row_from_col[0], datetime.time)
+ self.assertEqual(row_from_col[0], result)
+ row_from_name = df.select(F.make_time("hour", "minute", "second")).first()
+ self.assertIsInstance(row_from_name[0], datetime.time)
+ self.assertEqual(row_from_name[0], result)
+
def test_make_date(self):
# SPARK-36554: expose make_date expression
df = self.spark.createDataFrame([(2020, 6, 26)], ["Y", "M", "D"])
@@ -1275,6 +1326,11 @@ def test_datetime_functions(self):
parse_result = df.select(F.to_date(F.col("dateCol"))).first()
self.assertEqual(datetime.date(2017, 1, 22), parse_result["to_date(dateCol)"])
+ def test_try_datetime_functions(self):
+ df = self.spark.range(1).selectExpr("'2017-01-22' as dateCol")
+ parse_result = df.select(F.try_to_date(F.col("dateCol")).alias("tryToDateCol")).first()
+ self.assertEqual(datetime.date(2017, 1, 22), parse_result["tryToDateCol"])
+
def test_assert_true(self):
self.check_assert_true(SparkRuntimeException)
@@ -1344,6 +1400,11 @@ def test_shiftrightunsigned(self):
)
).collect()
+ def test_lit_time(self):
+ t = datetime.time(12, 34, 56)
+ actual = self.spark.range(1).select(F.lit(t)).first()[0]
+ self.assertEqual(actual, t)
+
def test_lit_day_time_interval(self):
td = datetime.timedelta(days=1, hours=12, milliseconds=123)
actual = self.spark.range(1).select(F.lit(td)).first()[0]
@@ -1614,6 +1675,35 @@ def test_try_parse_json(self):
self.assertEqual("""{"a":1}""", actual[0]["var"])
self.assertEqual(None, actual[1]["var"])
+ def test_try_to_time(self):
+ # SPARK-52891: test the try_to_time function.
+ df = self.spark.createDataFrame([("10:30:00", "HH:mm:ss")], ["time", "format"])
+ result = datetime.time(10, 30, 0)
+ # Test without format.
+ row_from_col_no_format = df.select(F.try_to_time(df.time)).first()
+ self.assertIsInstance(row_from_col_no_format[0], datetime.time)
+ self.assertEqual(row_from_col_no_format[0], result)
+ row_from_name_no_format = df.select(F.try_to_time("time")).first()
+ self.assertIsInstance(row_from_name_no_format[0], datetime.time)
+ self.assertEqual(row_from_name_no_format[0], result)
+ # Test with format.
+ row_from_col_with_format = df.select(F.try_to_time(df.time, df.format)).first()
+ self.assertIsInstance(row_from_col_with_format[0], datetime.time)
+ self.assertEqual(row_from_col_with_format[0], result)
+ row_from_name_with_format = df.select(F.try_to_time("time", "format")).first()
+ self.assertIsInstance(row_from_name_with_format[0], datetime.time)
+ self.assertEqual(row_from_name_with_format[0], result)
+ # Test with malformed time.
+ df = self.spark.createDataFrame([("malformed", "HH:mm:ss")], ["time", "format"])
+ row_from_col_no_format_malformed = df.select(F.try_to_time(df.time)).first()
+ self.assertIsNone(row_from_col_no_format_malformed[0])
+ row_from_name_no_format_malformed = df.select(F.try_to_time("time")).first()
+ self.assertIsNone(row_from_name_no_format_malformed[0])
+ row_from_col_with_format_malformed = df.select(F.try_to_time(df.time, df.format)).first()
+ self.assertIsNone(row_from_col_with_format_malformed[0])
+ row_from_name_with_format_malformed = df.select(F.try_to_time("time", "format")).first()
+ self.assertIsNone(row_from_name_with_format_malformed[0])
+
def test_to_variant_object(self):
df = self.spark.createDataFrame([(1, {"a": 1})], "i int, v struct")
actual = df.select(
@@ -1723,6 +1813,25 @@ def test_bucket(self):
messageParameters={"arg_name": "numBuckets", "arg_type": "str"},
)
+ def test_to_time(self):
+ # SPARK-52890: test the to_time function.
+ df = self.spark.createDataFrame([("10:30:00", "HH:mm:ss")], ["time", "format"])
+ result = datetime.time(10, 30, 0)
+ # Test without format.
+ row_from_col_no_format = df.select(F.to_time(df.time)).first()
+ self.assertIsInstance(row_from_col_no_format[0], datetime.time)
+ self.assertEqual(row_from_col_no_format[0], result)
+ row_from_name_no_format = df.select(F.to_time("time")).first()
+ self.assertIsInstance(row_from_name_no_format[0], datetime.time)
+ self.assertEqual(row_from_name_no_format[0], result)
+ # Test with format.
+ row_from_col_with_format = df.select(F.to_time(df.time, df.format)).first()
+ self.assertIsInstance(row_from_col_with_format[0], datetime.time)
+ self.assertEqual(row_from_col_with_format[0], result)
+ row_from_name_with_format = df.select(F.to_time("time", "format")).first()
+ self.assertIsInstance(row_from_name_with_format[0], datetime.time)
+ self.assertEqual(row_from_name_with_format[0], result)
+
def test_to_timestamp_ltz(self):
df = self.spark.createDataFrame([("2016-12-31",)], ["e"])
df = df.select(F.to_timestamp_ltz(df.e, F.lit("yyyy-MM-dd")).alias("r"))
@@ -1765,6 +1874,16 @@ def test_non_deterministic_with_seed(self):
for i in range(3):
self.assertEqual(res[0][i * 2], res[0][i * 2 + 1])
+ def test_current_time(self):
+ # SPARK-52889: test the current_time function without precision.
+ df = self.spark.range(1).select(F.current_time())
+ self.assertIsInstance(df.first()[0], datetime.time)
+ self.assertEqual(df.schema.names[0], "current_time(6)")
+ # SPARK-52889: test the current_time function with precision.
+ df = self.spark.range(1).select(F.current_time(3))
+ self.assertIsInstance(df.first()[0], datetime.time)
+ self.assertEqual(df.schema.names[0], "current_time(3)")
+
def test_current_timestamp(self):
df = self.spark.range(1).select(F.current_timestamp())
self.assertIsInstance(df.first()[0], datetime.datetime)
diff --git a/python/pyspark/sql/tests/test_python_streaming_datasource.py b/python/pyspark/sql/tests/test_python_streaming_datasource.py
index fa14b37b57e62..9879231540f1d 100644
--- a/python/pyspark/sql/tests/test_python_streaming_datasource.py
+++ b/python/pyspark/sql/tests/test_python_streaming_datasource.py
@@ -24,6 +24,7 @@
DataSourceStreamReader,
InputPartition,
DataSourceStreamWriter,
+ DataSourceStreamArrowWriter,
SimpleDataSourceStreamReader,
WriterCommitMessage,
)
@@ -295,6 +296,156 @@ def test_stream_writer(self):
output_dir.cleanup()
checkpoint_dir.cleanup()
+ def test_stream_arrow_writer(self):
+ """Test DataSourceStreamArrowWriter with Arrow RecordBatch format."""
+ import tempfile
+ import shutil
+ import json
+ import os
+ import pyarrow as pa
+ from dataclasses import dataclass
+
+ @dataclass
+ class ArrowCommitMessage(WriterCommitMessage):
+ partition_id: int
+ batch_count: int
+ total_rows: int
+
+ class TestStreamArrowWriter(DataSourceStreamArrowWriter):
+ def __init__(self, options):
+ self.options = options
+ self.path = self.options.get("path")
+ assert self.path is not None
+
+ def write(self, iterator):
+ from pyspark import TaskContext
+
+ context = TaskContext.get()
+ partition_id = context.partitionId()
+ batch_count = 0
+ total_rows = 0
+
+ for batch in iterator:
+ assert isinstance(batch, pa.RecordBatch)
+ batch_count += 1
+ total_rows += batch.num_rows
+
+ # Convert to pandas and write to temp JSON file
+ df = batch.to_pandas()
+
+ filename = f"partition_{partition_id}_batch_{batch_count}.json"
+ filepath = os.path.join(self.path, filename)
+
+ # Actually write the JSON file
+ df.to_json(filepath, orient="records")
+
+ commit_msg = ArrowCommitMessage(
+ partition_id=partition_id, batch_count=batch_count, total_rows=total_rows
+ )
+ return commit_msg
+
+ def commit(self, messages, batchId):
+ """Write commit metadata for successful batch."""
+ total_batches = sum(m.batch_count for m in messages if m)
+ total_rows = sum(m.total_rows for m in messages if m)
+
+ status = {
+ "batch_id": batchId,
+ "num_partitions": len([m for m in messages if m]),
+ "total_batches": total_batches,
+ "total_rows": total_rows,
+ }
+
+ with open(os.path.join(self.path, f"commit_{batchId}.json"), "w") as f:
+ json.dump(status, f)
+
+ def abort(self, messages, batchId):
+ """Handle batch failure."""
+ with open(os.path.join(self.path, f"abort_{batchId}.txt"), "w") as f:
+ f.write(f"Batch {batchId} aborted")
+
+ class TestDataSource(DataSource):
+ @classmethod
+ def name(cls):
+ return "TestArrowStreamWriter"
+
+ def schema(self):
+ return "id INT, name STRING, value DOUBLE"
+
+ def streamWriter(self, schema, overwrite):
+ return TestStreamArrowWriter(self.options)
+
+ # Create temporary directory for test
+ temp_dir = tempfile.mkdtemp()
+ try:
+ # Register the data source
+ self.spark.dataSource.register(TestDataSource)
+
+ # Create test data
+ df = (
+ self.spark.readStream.format("rate")
+ .option("rowsPerSecond", 10)
+ .option("numPartitions", 3)
+ .load()
+ .selectExpr("value as id", "concat('name_', value) as name", "value * 2.5 as value")
+ )
+
+ # Write using streaming with Arrow writer
+ query = (
+ df.writeStream.format("TestArrowStreamWriter")
+ .option("path", temp_dir)
+ .option("checkpointLocation", os.path.join(temp_dir, "checkpoint"))
+ .trigger(processingTime="1 seconds")
+ .start()
+ )
+
+ # Wait a bit for data to be processed, then stop
+ time.sleep(6) # Allow a few batches to run
+ query.stop()
+ query.awaitTermination()
+
+ # Since we're writing actual JSON files, verify commit metadata and written files
+ commit_files = [f for f in os.listdir(temp_dir) if f.startswith("commit_")]
+ self.assertTrue(len(commit_files) > 0, "No commit files were created")
+
+ # Read and verify commit metadata - check all commits for any with data
+ total_committed_rows = 0
+ total_committed_batches = 0
+
+ for commit_file in commit_files:
+ with open(os.path.join(temp_dir, commit_file), "r") as f:
+ commit_data = json.load(f)
+ total_committed_rows += commit_data.get("total_rows", 0)
+ total_committed_batches += commit_data.get("total_batches", 0)
+
+ # We should have both committed data AND JSON files written
+ json_files = [
+ f
+ for f in os.listdir(temp_dir)
+ if f.startswith("partition_") and f.endswith(".json")
+ ]
+
+ # Verify that we have both committed data AND JSON files
+ has_committed_data = total_committed_rows > 0
+ has_json_files = len(json_files) > 0
+
+ self.assertTrue(
+ has_committed_data, f"Expected committed data but got {total_committed_rows} rows"
+ )
+ self.assertTrue(
+ has_json_files, f"Expected JSON files but found {len(json_files)} files"
+ )
+
+ # Verify JSON files contain valid data
+ for json_file in json_files:
+ with open(os.path.join(temp_dir, json_file), "r") as f:
+ data = json.load(f)
+ self.assertTrue(len(data) > 0, f"JSON file {json_file} is empty")
+
+ finally:
+ # Clean up
+ shutil.rmtree(temp_dir, ignore_errors=True)
+
class PythonStreamingDataSourceTests(BasePythonStreamingDataSourceTestsMixin, ReusedSQLTestCase):
pass
diff --git a/python/pyspark/sql/tests/test_sql.py b/python/pyspark/sql/tests/test_sql.py
index bf50bbc11ac33..e60ad183d1474 100644
--- a/python/pyspark/sql/tests/test_sql.py
+++ b/python/pyspark/sql/tests/test_sql.py
@@ -168,6 +168,12 @@ def test_nested_dataframe(self):
self.assertEqual(df3.take(1), [Row(id=4)])
self.assertEqual(df3.tail(1), [Row(id=9)])
+ def test_lit_time(self):
+ import datetime
+
+ actual = self.spark.sql("select TIME '12:34:56'").first()[0]
+ self.assertEqual(actual, datetime.time(12, 34, 56))
+
class SQLTests(SQLTestsMixin, ReusedSQLTestCase):
pass
diff --git a/python/pyspark/sql/tests/test_stat.py b/python/pyspark/sql/tests/test_stat.py
index 804e2484536f8..fe1746dbd894d 100644
--- a/python/pyspark/sql/tests/test_stat.py
+++ b/python/pyspark/sql/tests/test_stat.py
@@ -435,12 +435,12 @@ def test_unpivot(self):
self.assertEqual(
actual.collect(),
[
- Row(var="int", value=10.0),
- Row(var="double", value=1.0),
- Row(var="int", value=20.0),
- Row(var="double", value=2.0),
- Row(var="int", value=30.0),
- Row(var="double", value=3.0),
+ Row(var="int", val=10.0),
+ Row(var="double", val=1.0),
+ Row(var="int", val=20.0),
+ Row(var="double", val=2.0),
+ Row(var="int", val=30.0),
+ Row(var="double", val=3.0),
],
)
@@ -455,12 +455,12 @@ def test_unpivot(self):
self.assertEqual(
actual.collect(),
[
- Row(id=1, var="int", value=10.0),
- Row(id=1, var="double", value=1.0),
- Row(id=2, var="int", value=20.0),
- Row(id=2, var="double", value=2.0),
- Row(id=3, var="int", value=30.0),
- Row(id=3, var="double", value=3.0),
+ Row(id=1, var="int", val=10.0),
+ Row(id=1, var="double", val=1.0),
+ Row(id=2, var="int", val=20.0),
+ Row(id=2, var="double", val=2.0),
+ Row(id=3, var="int", val=30.0),
+ Row(id=3, var="double", val=3.0),
],
)
@@ -475,12 +475,12 @@ def test_unpivot(self):
self.assertEqual(
actual.collect(),
[
- Row(id=1, double=1.0, var="int", value=10.0),
- Row(id=1, double=1.0, var="double", value=1.0),
- Row(id=2, double=2.0, var="int", value=20.0),
- Row(id=2, double=2.0, var="double", value=2.0),
- Row(id=3, double=3.0, var="int", value=30.0),
- Row(id=3, double=3.0, var="double", value=3.0),
+ Row(id=1, double=1.0, var="int", val=10.0),
+ Row(id=1, double=1.0, var="double", val=1.0),
+ Row(id=2, double=2.0, var="int", val=20.0),
+ Row(id=2, double=2.0, var="double", val=2.0),
+ Row(id=3, double=3.0, var="int", val=30.0),
+ Row(id=3, double=3.0, var="double", val=3.0),
],
)
@@ -491,15 +491,15 @@ def test_unpivot(self):
self.assertEqual(
actual.collect(),
[
- Row(var="id", value=1.0),
- Row(var="int", value=10.0),
- Row(var="double", value=1.0),
- Row(var="id", value=2.0),
- Row(var="int", value=20.0),
- Row(var="double", value=2.0),
- Row(var="id", value=3.0),
- Row(var="int", value=30.0),
- Row(var="double", value=3.0),
+ Row(var="id", val=1.0),
+ Row(var="int", val=10.0),
+ Row(var="double", val=1.0),
+ Row(var="id", val=2.0),
+ Row(var="int", val=20.0),
+ Row(var="double", val=2.0),
+ Row(var="id", val=3.0),
+ Row(var="int", val=30.0),
+ Row(var="double", val=3.0),
],
)
@@ -514,12 +514,12 @@ def test_unpivot(self):
self.assertEqual(
actual.collect(),
[
- Row(id=1, var="int", value=10.0),
- Row(id=1, var="double", value=1.0),
- Row(id=2, var="int", value=20.0),
- Row(id=2, var="double", value=2.0),
- Row(id=3, var="int", value=30.0),
- Row(id=3, var="double", value=3.0),
+ Row(id=1, var="int", val=10.0),
+ Row(id=1, var="double", val=1.0),
+ Row(id=2, var="int", val=20.0),
+ Row(id=2, var="double", val=2.0),
+ Row(id=3, var="int", val=30.0),
+ Row(id=3, var="double", val=3.0),
],
)
diff --git a/python/pyspark/sql/tests/test_types.py b/python/pyspark/sql/tests/test_types.py
index 185198766b794..319ff92dd362d 100644
--- a/python/pyspark/sql/tests/test_types.py
+++ b/python/pyspark/sql/tests/test_types.py
@@ -42,6 +42,7 @@
IntegerType,
FloatType,
DateType,
+ TimeType,
TimestampType,
TimestampNTZType,
DayTimeIntervalType,
@@ -183,6 +184,7 @@ def __init__(self):
"a",
datetime.date(1970, 1, 1),
datetime.datetime(1970, 1, 1, 0, 0),
+ datetime.time(hour=1, minute=2, second=3),
datetime.timedelta(microseconds=123456678),
1.0,
array.array("d", [1]),
@@ -206,6 +208,7 @@ def __init__(self):
"string",
"date",
"timestamp",
+ "time(6)",
"interval day to second",
"double",
"array",
@@ -229,6 +232,7 @@ def __init__(self):
"a",
datetime.date(1970, 1, 1),
datetime.datetime(1970, 1, 1, 0, 0),
+ datetime.time(hour=1, minute=2, second=3),
datetime.timedelta(microseconds=123456678),
1.0,
[1.0],
@@ -525,7 +529,7 @@ def test_create_dataframe_from_objects(self):
self.assertEqual(df.first(), Row(key=1, value="1"))
def test_apply_schema(self):
- from datetime import date, datetime, timedelta
+ from datetime import date, time, datetime, timedelta
rdd = self.sc.parallelize(
[
@@ -537,6 +541,7 @@ def test_apply_schema(self):
2147483647,
1.0,
date(2010, 1, 1),
+ time(23, 23, 59, 999999),
datetime(2010, 1, 1, 1, 1, 1),
timedelta(days=1),
{"a": 1},
@@ -555,6 +560,7 @@ def test_apply_schema(self):
StructField("int1", IntegerType(), False),
StructField("float1", FloatType(), False),
StructField("date1", DateType(), False),
+ StructField("time", TimeType(), False),
StructField("time1", TimestampType(), False),
StructField("daytime1", DayTimeIntervalType(), False),
StructField("map1", MapType(StringType(), IntegerType(), False), False),
@@ -573,6 +579,7 @@ def test_apply_schema(self):
x.int1,
x.float1,
x.date1,
+ x.time,
x.time1,
x.daytime1,
x.map1["a"],
@@ -589,6 +596,7 @@ def test_apply_schema(self):
2147483647,
1.0,
date(2010, 1, 1),
+ time(23, 23, 59, 999999),
datetime(2010, 1, 1, 1, 1, 1),
timedelta(days=1),
1,
@@ -642,6 +650,17 @@ def test_schema_with_collations_json_ser_de(self):
from pyspark.sql.types import _parse_datatype_json_string
unicode_collation = "UNICODE"
+ utf8_lcase_collation = "UTF8_LCASE"
+
+ standalone_string = StringType(unicode_collation)
+
+ standalone_array = ArrayType(StringType(unicode_collation))
+
+ standalone_map = MapType(StringType(utf8_lcase_collation), StringType(unicode_collation))
+
+ standalone_nested = ArrayType(
+ MapType(StringType(utf8_lcase_collation), ArrayType(StringType(unicode_collation)))
+ )
simple_struct = StructType([StructField("c1", StringType(unicode_collation))])
@@ -713,6 +732,10 @@ def test_schema_with_collations_json_ser_de(self):
)
schemas = [
+ standalone_string,
+ standalone_array,
+ standalone_map,
+ standalone_nested,
simple_struct,
nested_struct,
array_in_schema,
@@ -1241,6 +1264,7 @@ def test_parse_datatype_json_string(self):
IntegerType(),
LongType(),
DateType(),
+ TimeType(5),
TimestampType(),
TimestampNTZType(),
NullType(),
@@ -1291,6 +1315,8 @@ def test_parse_datatype_string(self):
_parse_datatype_string("a INT, c DOUBLE"),
)
self.assertEqual(VariantType(), _parse_datatype_string("variant"))
+ self.assertEqual(TimeType(5), _parse_datatype_string("time(5)"))
+ self.assertEqual(TimeType(), _parse_datatype_string("time( 6 )"))
def test_tree_string(self):
schema1 = DataType.fromDDL("c1 INT, c2 STRUCT>")
@@ -1543,6 +1569,7 @@ def test_tree_string_for_builtin_types(self):
.add("bin", BinaryType())
.add("bool", BooleanType())
.add("date", DateType())
+ .add("time", TimeType())
.add("ts", TimestampType())
.add("ts_ntz", TimestampNTZType())
.add("dec", DecimalType(10, 2))
@@ -1578,6 +1605,7 @@ def test_tree_string_for_builtin_types(self):
" |-- bin: binary (nullable = true)",
" |-- bool: boolean (nullable = true)",
" |-- date: date (nullable = true)",
+ " |-- time: time(6) (nullable = true)",
" |-- ts: timestamp (nullable = true)",
" |-- ts_ntz: timestamp_ntz (nullable = true)",
" |-- dec: decimal(10,2) (nullable = true)",
@@ -1925,6 +1953,7 @@ def test_repr(self):
BinaryType(),
BooleanType(),
DateType(),
+ TimeType(),
TimestampType(),
DecimalType(),
DoubleType(),
@@ -2332,8 +2361,10 @@ def test_to_ddl(self):
schema = StructType().add("a", ArrayType(DoubleType()), False).add("b", DateType())
self.assertEqual(schema.toDDL(), "a ARRAY NOT NULL,b DATE")
- schema = StructType().add("a", TimestampType()).add("b", TimestampNTZType())
- self.assertEqual(schema.toDDL(), "a TIMESTAMP,b TIMESTAMP_NTZ")
+ schema = (
+ StructType().add("a", TimestampType()).add("b", TimestampNTZType()).add("c", TimeType())
+ )
+ self.assertEqual(schema.toDDL(), "a TIMESTAMP,b TIMESTAMP_NTZ,c TIME(6)")
def test_from_ddl(self):
self.assertEqual(DataType.fromDDL("long"), LongType())
@@ -2349,6 +2380,10 @@ def test_from_ddl(self):
DataType.fromDDL("a int, v variant"),
StructType([StructField("a", IntegerType()), StructField("v", VariantType())]),
)
+ self.assertEqual(
+ DataType.fromDDL("a time(6)"),
+ StructType([StructField("a", TimeType(6))]),
+ )
# Ensures that changing the implementation of `DataType.fromDDL` in PR #47253 does not change
# `fromDDL`'s behavior.
@@ -2602,8 +2637,9 @@ def __init__(self, **kwargs):
(decimal.Decimal("1.0"), DecimalType()),
# Binary
(bytearray([1, 2]), BinaryType()),
- # Date/Timestamp
+ # Date/Time/Timestamp
(datetime.date(2000, 1, 2), DateType()),
+ (datetime.time(1, 0, 0), TimeType()),
(datetime.datetime(2000, 1, 2, 3, 4), DateType()),
(datetime.datetime(2000, 1, 2, 3, 4), TimestampType()),
# Array
@@ -2666,8 +2702,9 @@ def __init__(self, **kwargs):
("1.0", DecimalType(), TypeError),
# Binary
(1, BinaryType(), TypeError),
- # Date/Timestamp
+ # Date/Time/Timestamp
("2000-01-02", DateType(), TypeError),
+ ("23:59:59", TimeType(), TypeError),
(946811040, TimestampType(), TypeError),
# Array
(["1", None], ArrayType(StringType(), containsNull=False), ValueError),
diff --git a/python/pyspark/sql/tests/test_udf.py b/python/pyspark/sql/tests/test_udf.py
index bd4db5306cb75..9d130a7f525ac 100644
--- a/python/pyspark/sql/tests/test_udf.py
+++ b/python/pyspark/sql/tests/test_udf.py
@@ -1379,6 +1379,73 @@ def add1(x):
result = empty_df.select(add1("id"))
self.assertEqual(result.collect(), [])
+ def test_udf_with_collated_string_types(self):
+ @udf("string collate fr")
+ def my_udf(input_val):
+ return "%s - %s" % (type(input_val), input_val)
+
+ string_types = [
+ StringType(),
+ StringType("UTF8_BINARY"),
+ StringType("UTF8_LCASE"),
+ StringType("UNICODE"),
+ ]
+ data = [("hello",)]
+ expected = " - hello"
+
+ for string_type in string_types:
+ schema = StructType([StructField("input_col", string_type, True)])
+ df = self.spark.createDataFrame(data, schema=schema)
+ df_result = df.select(my_udf(df.input_col).alias("result"))
+ row = df_result.collect()[0][0]
+ self.assertEqual(row, expected)
+ result_type = df_result.schema["result"].dataType
+ self.assertEqual(result_type, StringType("fr"))
+
+ def test_udf_with_char_varchar_return_type(self):
+ (char_type, char_value) = ("char(10)", "a")
+ (varchar_type, varchar_value) = ("varchar(8)", "a")
+ (array_with_char_type, array_with_char_type_value) = ("array", ["a", "b"])
+ (array_with_varchar_type, array_with_varchar_value) = ("array", ["a", "b"])
+ (map_type, map_value) = (f"map<{char_type}, {varchar_type}>", {"a": "b"})
+ (struct_type, struct_value) = (
+ f"struct",
+ {"f1": "a", "f2": "b"},
+ )
+
+ pairs = [
+ (char_type, char_value),
+ (varchar_type, varchar_value),
+ (array_with_char_type, array_with_char_type_value),
+ (array_with_varchar_type, array_with_varchar_value),
+ (map_type, map_value),
+ (struct_type, struct_value),
+ (
+ f"struct",
+ f"{{'f1': {array_with_char_type_value}, 'f2': {array_with_varchar_value}, "
+ f"'f3': {map_value}}}",
+ ),
+ (
+ f"map<{array_with_char_type}, {array_with_varchar_type}>",
+ f"{{{array_with_char_type_value}: {array_with_varchar_value}}}",
+ ),
+ (f"array<{struct_type}>", [struct_value, struct_value]),
+ ]
+
+ for return_type, return_value in pairs:
+ with self.assertRaisesRegex(
+ Exception,
+ "(Please use a different output data type for your UDF or DataFrame|"
+ "Invalid return type with Arrow-optimized Python UDF)",
+ ):
+
+ @udf(return_type)
+ def my_udf():
+ return return_value
+
+ self.spark.range(1).select(my_udf().alias("result")).show()
+
class UDFTests(BaseUDFTestsMixin, ReusedSQLTestCase):
@classmethod
diff --git a/python/pyspark/sql/tests/test_udf_combinations.py b/python/pyspark/sql/tests/test_udf_combinations.py
new file mode 100644
index 0000000000000..8111bb79d3c75
--- /dev/null
+++ b/python/pyspark/sql/tests/test_udf_combinations.py
@@ -0,0 +1,208 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+from typing import Iterator
+import itertools
+import unittest
+
+from pyspark.sql.functions import udf, arrow_udf, pandas_udf
+from pyspark.testing.sqlutils import ReusedSQLTestCase
+from pyspark.testing.utils import (
+ have_pandas,
+ have_pyarrow,
+ pandas_requirement_message,
+ pyarrow_requirement_message,
+)
+
+
+@unittest.skipIf(
+ not have_pandas or not have_pyarrow,
+ pandas_requirement_message or pyarrow_requirement_message,
+)
+class UDFCombinationsTestsMixin:
+ @property
+ def python_udf_add1(self):
+ @udf("long")
+ def py_add1(v):
+ assert isinstance(v, int)
+ return v + 1
+
+ return py_add1
+
+ @property
+ def arrow_opt_python_udf_add1(self):
+ @udf("long")
+ def py_arrow_opt_add1(v, useArrow=True):
+ assert isinstance(v, int)
+ return v + 1
+
+ return py_arrow_opt_add1
+
+ @property
+ def pandas_udf_add1(self):
+ import pandas as pd
+
+ @pandas_udf("long")
+ def pandas_add1(s):
+ assert isinstance(s, pd.Series)
+ return s + 1
+
+ return pandas_add1
+
+ @property
+ def pandas_iter_udf_add1(self):
+ import pandas as pd
+
+ @pandas_udf("long")
+ def pandas_iter_add1(it: Iterator[pd.Series]) -> Iterator[pd.Series]:
+ for s in it:
+ assert isinstance(s, pd.Series)
+ yield s + 1
+
+ return pandas_iter_add1
+
+ @property
+ def arrow_udf_add1(self):
+ import pyarrow as pa
+
+ @arrow_udf("long")
+ def arrow_add1(a):
+ assert isinstance(a, pa.Array)
+ return pa.compute.add(a, 1)
+
+ return arrow_add1
+
+ @property
+ def arrow_iter_udf_add1(self):
+ import pyarrow as pa
+
+ @arrow_udf("long")
+ def arrow_iter_add1(it: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ for a in it:
+ assert isinstance(a, pa.Array)
+ yield pa.compute.add(a, 1)
+
+ return arrow_iter_add1
+
+ def all_scalar_functions(self):
+ return [
+ self.python_udf_add1,
+ self.arrow_opt_python_udf_add1,
+ self.pandas_udf_add1,
+ self.pandas_iter_udf_add1,
+ self.arrow_udf_add1,
+ self.arrow_iter_udf_add1,
+ ]
+
+ def test_combination_2(self):
+ df = self.spark.range(10)
+
+ expected = df.selectExpr("id + 2 AS res").collect()
+
+ combs = itertools.combinations(self.all_scalar_functions(), 2)
+ for f1, f2 in combs:
+ with self.subTest(
+ udf1=f1.__name__,
+ udf2=f2.__name__,
+ ):
+ result = df.select(f1(f2("id")).alias("res"))
+ self.assertEqual(expected, result.collect())
+
+ def test_combination_3(self):
+ df = self.spark.range(10)
+
+ expected = df.selectExpr("id + 3 AS res").collect()
+
+ combs = itertools.combinations(self.all_scalar_functions(), 3)
+ for f1, f2, f3 in combs:
+ with self.subTest(
+ udf1=f1.__name__,
+ udf2=f2.__name__,
+ udf3=f3.__name__,
+ ):
+ result = df.select(f1(f2(f3("id"))).alias("res"))
+ self.assertEqual(expected, result.collect())
+
+ def test_combination_4(self):
+ df = self.spark.range(10)
+
+ expected = df.selectExpr("id + 4 AS res").collect()
+
+ combs = itertools.combinations(self.all_scalar_functions(), 4)
+ for f1, f2, f3, f4 in combs:
+ with self.subTest(
+ udf1=f1.__name__,
+ udf2=f2.__name__,
+ udf3=f3.__name__,
+ udf4=f4.__name__,
+ ):
+ result = df.select(f1(f2(f3(f4("id")))).alias("res"))
+ self.assertEqual(expected, result.collect())
+
+ def test_combination_5(self):
+ df = self.spark.range(10)
+
+ expected = df.selectExpr("id + 5 AS res").collect()
+
+ combs = itertools.combinations(self.all_scalar_functions(), 5)
+ for f1, f2, f3, f4, f5 in combs:
+ with self.subTest(
+ udf1=f1.__name__,
+ udf2=f2.__name__,
+ udf3=f3.__name__,
+ udf4=f4.__name__,
+ udf5=f5.__name__,
+ ):
+ result = df.select(f1(f2(f3(f4(f5("id"))))).alias("res"))
+ self.assertEqual(expected, result.collect())
+
+ def test_combination_6(self):
+ df = self.spark.range(10)
+
+ expected = df.selectExpr("id + 6 AS res").collect()
+
+ combs = itertools.combinations(self.all_scalar_functions(), 6)
+ for f1, f2, f3, f4, f5, f6 in combs:
+ with self.subTest(
+ udf1=f1.__name__,
+ udf2=f2.__name__,
+ udf3=f3.__name__,
+ udf4=f4.__name__,
+ udf5=f5.__name__,
+ udf6=f6.__name__,
+ ):
+ result = df.select(f1(f2(f3(f4(f5(f6("id")))))).alias("res"))
+ self.assertEqual(expected, result.collect())
+
+
+class UDFCombinationsTests(UDFCombinationsTestsMixin, ReusedSQLTestCase):
+ @classmethod
+ def setUpClass(cls):
+ ReusedSQLTestCase.setUpClass()
+ cls.spark.conf.set("spark.sql.execution.pythonUDF.arrow.enabled", "false")
+
+
+if __name__ == "__main__":
+ from pyspark.sql.tests.test_udf_combinations import * # noqa: F401
+
+ try:
+ import xmlrunner # type: ignore
+
+ testRunner = xmlrunner.XMLTestRunner(output="target/test-reports", verbosity=2)
+ except ImportError:
+ testRunner = None
+ unittest.main(testRunner=testRunner, verbosity=2)
diff --git a/python/pyspark/sql/tests/test_udf_profiler.py b/python/pyspark/sql/tests/test_udf_profiler.py
index 8c45149605c72..de35532285df6 100644
--- a/python/pyspark/sql/tests/test_udf_profiler.py
+++ b/python/pyspark/sql/tests/test_udf_profiler.py
@@ -28,7 +28,7 @@
from pyspark import SparkConf
from pyspark.errors import PySparkValueError
from pyspark.sql import SparkSession
-from pyspark.sql.functions import col, pandas_udf, udf
+from pyspark.sql.functions import col, arrow_udf, pandas_udf, udf
from pyspark.sql.window import Window
from pyspark.profiler import UDFBasicProfiler
from pyspark.testing.sqlutils import ReusedSQLTestCase
@@ -127,6 +127,16 @@ def iter_to_iter(batch_ser: Iterator[pd.Series]) -> Iterator[pd.Series]:
self.spark.range(10).select(iter_to_iter("id")).collect()
+ def exec_arrow_udf_iter_to_iter(self):
+ import pyarrow as pa
+
+ @arrow_udf("int")
+ def iter_to_iter(iter: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ for s in iter:
+ yield pa.compute.add(s, 1)
+
+ self.spark.range(10).select(iter_to_iter("id")).collect()
+
# Unsupported
def exec_map(self):
import pandas as pd
@@ -149,6 +159,15 @@ def test_unsupported(self):
"Profiling UDFs with iterators input/output is not supported" in str(user_warns[0])
)
+ with warnings.catch_warnings(record=True) as warns:
+ warnings.simplefilter("always")
+ self.exec_arrow_udf_iter_to_iter()
+ user_warns = [warn.message for warn in warns if isinstance(warn.message, UserWarning)]
+ self.assertTrue(len(user_warns) > 0)
+ self.assertTrue(
+ "Profiling UDFs with iterators input/output is not supported" in str(user_warns[0])
+ )
+
with warnings.catch_warnings(record=True) as warns:
warnings.simplefilter("always")
self.exec_map()
@@ -278,6 +297,29 @@ def add2(x):
for id in self.profile_results:
self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=2)
+ @unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+ def test_perf_profiler_arrow_udf(self):
+ import pyarrow as pa
+
+ @arrow_udf("long")
+ def add1(x):
+ return pa.compute.add(x, 1)
+
+ @arrow_udf("long")
+ def add2(x):
+ return pa.compute.add(x, 2)
+
+ with self.sql_conf({"spark.sql.pyspark.udf.profiler": "perf"}):
+ df = self.spark.range(10, numPartitions=2).select(
+ add1("id"), add2("id"), add1("id"), add2(col("id") + 1)
+ )
+ df.collect()
+
+ self.assertEqual(3, len(self.profile_results), str(self.profile_results.keys()))
+
+ for id in self.profile_results:
+ self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=2)
+
@unittest.skipIf(
not have_pandas or not have_pyarrow,
cast(str, pandas_requirement_message or pyarrow_requirement_message),
@@ -305,6 +347,30 @@ def add2(iter: Iterator[pd.Series]) -> Iterator[pd.Series]:
for id in self.profile_results:
self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=2)
+ @unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+ def test_perf_profiler_arrow_udf_iterator_not_supported(self):
+ import pyarrow as pa
+
+ @arrow_udf("long")
+ def add1(x):
+ return pa.compute.add(x, 1)
+
+ @arrow_udf("long")
+ def add2(iter: Iterator[pa.Array]) -> Iterator[pa.Array]:
+ for s in iter:
+ yield pa.compute.add(s, 2)
+
+ with self.sql_conf({"spark.sql.pyspark.udf.profiler": "perf"}):
+ df = self.spark.range(10, numPartitions=2).select(
+ add1("id"), add2("id"), add1("id"), add2(col("id") + 1)
+ )
+ df.collect()
+
+ self.assertEqual(1, len(self.profile_results), str(self.profile_results.keys()))
+
+ for id in self.profile_results:
+ self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=2)
+
@unittest.skipIf(
not have_pandas or not have_pyarrow,
cast(str, pandas_requirement_message or pyarrow_requirement_message),
@@ -346,6 +412,27 @@ def mean_udf(v: pd.Series) -> float:
for id in self.profile_results:
self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=5)
+ @unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+ def test_perf_profiler_arrow_udf_window(self):
+ import pyarrow as pa
+
+ @arrow_udf("double")
+ def mean_udf(v: pa.Array) -> float:
+ return pa.compute.mean(v)
+
+ df = self.spark.createDataFrame(
+ [(1, 1.0), (1, 2.0), (2, 3.0), (2, 5.0), (2, 10.0)], ("id", "v")
+ )
+ w = Window.partitionBy("id").orderBy("v").rowsBetween(-1, 0)
+
+ with self.sql_conf({"spark.sql.pyspark.udf.profiler": "perf"}):
+ df.withColumn("mean_v", mean_udf("v").over(w)).show()
+
+ self.assertEqual(1, len(self.profile_results), str(self.profile_results.keys()))
+
+ for id in self.profile_results:
+ self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=5)
+
@unittest.skipIf(
not have_pandas or not have_pyarrow,
cast(str, pandas_requirement_message or pyarrow_requirement_message),
@@ -369,6 +456,25 @@ def min_udf(v: pd.Series) -> float:
for id in self.profile_results:
self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=2)
+ @unittest.skipIf(not have_pyarrow, pyarrow_requirement_message)
+ def test_perf_profiler_arrow_udf_agg(self):
+ import pyarrow as pa
+
+ @arrow_udf("double")
+ def min_udf(v: pa.Array) -> float:
+ return pa.compute.min(v)
+
+ with self.sql_conf({"spark.sql.pyspark.udf.profiler": "perf"}):
+ df = self.spark.createDataFrame(
+ [(2, "Alice"), (3, "Alice"), (5, "Bob"), (10, "Bob")], ["age", "name"]
+ )
+ df.groupBy(df.name).agg(min_udf(df.age)).show()
+
+ self.assertEqual(1, len(self.profile_results), str(self.profile_results.keys()))
+
+ for id in self.profile_results:
+ self.assert_udf_profile_present(udf_id=id, expected_line_count_prefix=2)
+
@unittest.skipIf(
not have_pandas or not have_pyarrow,
cast(str, pandas_requirement_message or pyarrow_requirement_message),
diff --git a/python/pyspark/sql/tests/test_udtf.py b/python/pyspark/sql/tests/test_udtf.py
index b5536ddc7b5d0..b006ac6c14d4a 100644
--- a/python/pyspark/sql/tests/test_udtf.py
+++ b/python/pyspark/sql/tests/test_udtf.py
@@ -63,6 +63,7 @@
VariantVal,
)
from pyspark.testing import assertDataFrameEqual, assertSchemaEqual
+from pyspark.testing.objects import ExamplePoint, ExamplePointUDT
from pyspark.testing.sqlutils import (
have_pandas,
have_pyarrow,
@@ -169,11 +170,58 @@ def eval(self, a: int, b: int) -> Iterator:
self.spark.udtf.register("testUDTF", TestUDTF)
+ for i, df in enumerate(
+ [
+ self.spark.sql("values (0, 1), (1, 2) t(a, b)").lateralJoin(
+ TestUDTF(col("a").outer(), col("b").outer())
+ ),
+ self.spark.sql("values (0, 1), (1, 2) t(a, b)").lateralJoin(
+ TestUDTF(a=col("a").outer(), b=col("b").outer())
+ ),
+ self.spark.sql("values (0, 1), (1, 2) t(a, b)").lateralJoin(
+ TestUDTF(b=col("b").outer(), a=col("a").outer())
+ ),
+ ]
+ ):
+ with self.subTest(query_no=i):
+ assertDataFrameEqual(
+ df,
+ self.spark.sql(
+ "SELECT * FROM values (0, 1), (1, 2) t(a, b), LATERAL testUDTF(a, b)"
+ ),
+ )
+
+ @udtf(returnType="a: int")
+ class TestUDTF:
+ def eval(self):
+ yield 1,
+ yield 2,
+
assertDataFrameEqual(
- self.spark.sql("values (0, 1), (1, 2) t(a, b)").lateralJoin(
- TestUDTF(col("a").outer(), col("b").outer())
- ),
- self.spark.sql("SELECT * FROM values (0, 1), (1, 2) t(a, b), LATERAL testUDTF(a, b)"),
+ self.spark.range(3, numPartitions=1).lateralJoin(TestUDTF()),
+ [
+ Row(id=0, a=1),
+ Row(id=0, a=2),
+ Row(id=1, a=1),
+ Row(id=1, a=2),
+ Row(id=2, a=1),
+ Row(id=2, a=2),
+ ],
+ )
+
+ @udtf(returnType="a: int")
+ class TestUDTF:
+ def eval(self, i: int):
+ for n in range(i):
+ yield n,
+
+ assertDataFrameEqual(
+ self.spark.range(3, numPartitions=1).lateralJoin(TestUDTF(col("id").outer())),
+ [
+ Row(id=1, a=0),
+ Row(id=2, a=0),
+ Row(id=2, a=1),
+ ],
)
def test_udtf_eval_with_return_stmt(self):
@@ -202,6 +250,62 @@ def eval(self, a: int):
with self.assertRaisesRegex(PythonException, "UDTF_INVALID_OUTPUT_ROW_TYPE"):
TestUDTF(lit(1)).collect()
+ @udtf(returnType="a: int")
+ class TestUDTF:
+ def eval(self, a: int):
+ return [a]
+
+ with self.assertRaisesRegex(PythonException, "UDTF_INVALID_OUTPUT_ROW_TYPE"):
+ TestUDTF(lit(1)).collect()
+
+ @udtf(returnType=StructType().add("point", ExamplePointUDT()))
+ class TestUDTF:
+ def eval(self, x: float, y: float):
+ yield ExamplePoint(x=x * 10, y=y * 10)
+
+ with self.assertRaisesRegex(PythonException, "UDTF_INVALID_OUTPUT_ROW_TYPE"):
+ TestUDTF(lit(1.0), lit(2.0)).collect()
+
+ def test_udtf_eval_returning_tuple_with_struct_type(self):
+ @udtf(returnType="a: struct")
+ class TestUDTF:
+ def eval(self, a: int):
+ yield (a, a + 1),
+
+ assertDataFrameEqual(TestUDTF(lit(1)), [Row(a=Row(b=1, c=2))])
+
+ @udtf(returnType="a: struct")
+ class TestUDTF:
+ def eval(self, a: int):
+ yield a, a + 1
+
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
+ TestUDTF(lit(1)).collect()
+
+ def test_udtf_eval_returning_udt(self):
+ @udtf(returnType=StructType().add("point", ExamplePointUDT()))
+ class TestUDTF:
+ def eval(self, x: float, y: float):
+ yield ExamplePoint(x=x * 10, y=y * 10),
+
+ assertDataFrameEqual(
+ TestUDTF(lit(1.0), lit(2.0)), [Row(point=ExamplePoint(x=10.0, y=20.0))]
+ )
+
+ def test_udtf_eval_taking_udt(self):
+ @udtf(returnType="x: double, y: double")
+ class TestUDTF:
+ def eval(self, point: ExamplePoint):
+ yield point.x * 10, point.y * 10
+
+ df = self.spark.createDataFrame(
+ [(ExamplePoint(x=1.0, y=2.0),)], schema=StructType().add("point", ExamplePointUDT())
+ )
+ assertDataFrameEqual(
+ df.lateralJoin(TestUDTF(col("point").outer())),
+ [Row(point=ExamplePoint(x=1.0, y=2.0), x=10.0, y=20.0)],
+ )
+
def test_udtf_with_invalid_return_value(self):
@udtf(returnType="x: int")
class TestUDTF:
@@ -351,15 +455,13 @@ def terminate(self, a: int):
TestUDTF(lit(1)).show()
def test_udtf_with_wrong_num_output(self):
- err_msg = "(UDTF_ARROW_TYPE_CONVERSION_ERROR|UDTF_RETURN_SCHEMA_MISMATCH)"
-
# Output less columns than specified return schema
@udtf(returnType="a: int, b: int")
class TestUDTF:
def eval(self, a: int):
yield a,
- with self.assertRaisesRegex(PythonException, err_msg):
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
TestUDTF(lit(1)).collect()
# Output more columns than specified return schema
@@ -368,7 +470,7 @@ class TestUDTF:
def eval(self, a: int):
yield a, a + 1
- with self.assertRaisesRegex(PythonException, err_msg):
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
TestUDTF(lit(1)).collect()
def test_udtf_with_empty_output_schema_and_non_empty_output(self):
@@ -377,9 +479,7 @@ class TestUDTF:
def eval(self):
yield 1,
- with self.assertRaisesRegex(
- PythonException, "(UDTF_RETURN_SCHEMA_MISMATCH|UDTF_ARROW_TYPE_CONVERSION_ERROR)"
- ):
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
TestUDTF().collect()
def test_udtf_with_non_empty_output_schema_and_empty_output(self):
@@ -388,9 +488,7 @@ class TestUDTF:
def eval(self):
yield tuple()
- with self.assertRaisesRegex(
- PythonException, "(UDTF_RETURN_SCHEMA_MISMATCH|UDTF_ARROW_TYPE_CONVERSION_ERROR)"
- ):
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
TestUDTF().collect()
def test_udtf_init(self):
@@ -545,8 +643,6 @@ def terminate(self):
TestUDTF(lit(1)).collect()
def test_udtf_terminate_with_wrong_num_output(self):
- err_msg = "(UDTF_RETURN_SCHEMA_MISMATCH|UDTF_ARROW_TYPE_CONVERSION_ERROR)"
-
@udtf(returnType="a: int, b: int")
class TestUDTF:
def eval(self, a: int):
@@ -555,7 +651,7 @@ def eval(self, a: int):
def terminate(self):
yield 1, 2, 3
- with self.assertRaisesRegex(PythonException, err_msg):
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
TestUDTF(lit(1)).show()
@udtf(returnType="a: int, b: int")
@@ -566,7 +662,7 @@ def eval(self, a: int):
def terminate(self):
yield 1,
- with self.assertRaisesRegex(PythonException, err_msg):
+ with self.assertRaisesRegex(PythonException, "UDTF_RETURN_SCHEMA_MISMATCH"):
TestUDTF(lit(1)).show()
def test_udtf_determinism(self):
@@ -2036,6 +2132,25 @@ def eval(self, a, b):
with self.subTest(query_no=i):
assertDataFrameEqual(df, [Row(a=10)])
+ def test_udtf_with_named_table_arguments(self):
+ @udtf(returnType="a: int")
+ class TestUDTF:
+ def eval(self, a, b):
+ yield a.id,
+
+ self.spark.udtf.register("test_udtf", TestUDTF)
+
+ for i, df in enumerate(
+ [
+ self.spark.sql("SELECT * FROM test_udtf(a => TABLE(FROM range(3)), b => 'x')"),
+ self.spark.sql("SELECT * FROM test_udtf(b => 'x', a => TABLE(FROM range(3)))"),
+ TestUDTF(a=self.spark.range(3).asTable(), b=lit("x")),
+ TestUDTF(b=lit("x"), a=self.spark.range(3).asTable()),
+ ]
+ ):
+ with self.subTest(query_no=i):
+ assertDataFrameEqual(df, [Row(a=i) for i in range(3)])
+
def test_udtf_with_named_arguments_negative(self):
@udtf(returnType="a: int")
class TestUDTF:
@@ -2088,6 +2203,25 @@ def eval(self, **kwargs):
with self.assertRaisesRegex(AnalysisException, "UNEXPECTED_POSITIONAL_ARGUMENT"):
self.spark.sql("SELECT * FROM test_udtf(a => 10, 'x')").show()
+ def test_udtf_with_table_argument_and_kwargs(self):
+ @udtf(returnType="a: int, b: string")
+ class TestUDTF:
+ def eval(self, **kwargs):
+ yield kwargs["a"].id, kwargs["b"]
+
+ self.spark.udtf.register("test_udtf", TestUDTF)
+
+ for i, df in enumerate(
+ [
+ self.spark.sql("SELECT * FROM test_udtf(a => TABLE(FROM range(3)), b => 'x')"),
+ self.spark.sql("SELECT * FROM test_udtf(b => 'x', a => TABLE(FROM range(3)))"),
+ TestUDTF(a=self.spark.range(3).asTable(), b=lit("x")),
+ TestUDTF(b=lit("x"), a=self.spark.range(3).asTable()),
+ ]
+ ):
+ with self.subTest(query_no=i):
+ assertDataFrameEqual(df, [Row(a=i, b="x") for i in range(3)])
+
def test_udtf_with_analyze_kwargs(self):
@udtf
class TestUDTF:
@@ -2122,6 +2256,38 @@ def eval(self, **kwargs):
with self.subTest(query_no=i):
assertDataFrameEqual(df, [Row(a=10, b="x")])
+ def test_udtf_with_table_argument_and_analyze_kwargs(self):
+ @udtf
+ class TestUDTF:
+ @staticmethod
+ def analyze(**kwargs: AnalyzeArgument) -> AnalyzeResult:
+ assert isinstance(kwargs["a"].dataType, StructType)
+ assert kwargs["a"].isTable is True
+ assert isinstance(kwargs["b"].dataType, StringType)
+ assert kwargs["b"].value == "x"
+ assert not kwargs["b"].isTable
+ return AnalyzeResult(
+ StructType(
+ [StructField(key, arg.dataType) for key, arg in sorted(kwargs.items())]
+ )
+ )
+
+ def eval(self, **kwargs):
+ yield tuple(value for _, value in sorted(kwargs.items()))
+
+ self.spark.udtf.register("test_udtf", TestUDTF)
+
+ for i, df in enumerate(
+ [
+ self.spark.sql("SELECT * FROM test_udtf(a => TABLE(FROM range(3)), b => 'x')"),
+ self.spark.sql("SELECT * FROM test_udtf(b => 'x', a => TABLE(FROM range(3)))"),
+ TestUDTF(a=self.spark.range(3).asTable(), b=lit("x")),
+ TestUDTF(b=lit("x"), a=self.spark.range(3).asTable()),
+ ]
+ ):
+ with self.subTest(query_no=i):
+ assertDataFrameEqual(df, [Row(a=Row(id=i), b="x") for i in range(3)])
+
def test_udtf_with_named_arguments_lateral_join(self):
@udtf
class TestUDTF:
@@ -2841,6 +3007,43 @@ def eval(self):
err_type=Exception,
)
+ def test_udtf_with_collated_string_types(self):
+ @udtf(
+ returnType="out1 string, out2 string collate UTF8_BINARY, "
+ "out3 string collate UTF8_LCASE, out4 string collate UNICODE"
+ )
+ class MyUDTF:
+ def eval(self, v1, v2, v3, v4):
+ yield (v1 + "1", v2 + "2", v3 + "3", v4 + "4")
+
+ schema = StructType(
+ [
+ StructField("col1", StringType(), True),
+ StructField("col2", StringType("UTF8_BINARY"), True),
+ StructField("col3", StringType("UTF8_LCASE"), True),
+ StructField("col4", StringType("UNICODE"), True),
+ ]
+ )
+ df = self.spark.createDataFrame([("hello",) * 4], schema=schema)
+
+ result_df = df.lateralJoin(
+ MyUDTF(
+ col("col1").outer(), col("col2").outer(), col("col3").outer(), col("col4").outer()
+ )
+ ).select("out1", "out2", "out3", "out4")
+
+ expected_row = ("hello1", "hello2", "hello3", "hello4")
+ self.assertEqual(result_df.collect()[0], expected_row)
+
+ expected_output_types = [
+ StringType(),
+ StringType("UTF8_BINARY"),
+ StringType("UTF8_LCASE"),
+ StringType("UNICODE"),
+ ]
+ for idx, field in enumerate(result_df.schema.fields):
+ self.assertEqual(field.dataType, expected_output_types[idx])
+
class UDTFTests(BaseUDTFTestsMixin, ReusedSQLTestCase):
@classmethod
@@ -2905,6 +3108,13 @@ def eval(self, a: int):
# When arrow is enabled, it can handle non-tuple return value.
assertDataFrameEqual(TestUDTF(lit(1)), [Row(a=1)])
+ @udtf(returnType="a: int")
+ class TestUDTF:
+ def eval(self, a: int):
+ return (a,)
+
+ assertDataFrameEqual(TestUDTF(lit(1)), [Row(a=1)])
+
@udtf(returnType="a: int")
class TestUDTF:
def eval(self, a: int):
@@ -2912,6 +3122,27 @@ def eval(self, a: int):
assertDataFrameEqual(TestUDTF(lit(1)), [Row(a=1)])
+ @udtf(returnType=StructType().add("udt", ExamplePointUDT()))
+ class TestUDTF:
+ def eval(self, x: float, y: float):
+ yield ExamplePoint(x=x * 10, y=y * 10)
+
+ assertDataFrameEqual(TestUDTF(lit(1.0), lit(2.0)), [Row(udt=ExamplePoint(x=10.0, y=20.0))])
+
+ def test_udtf_use_large_var_types(self):
+ for use_large_var_types in [True, False]:
+ with self.subTest(use_large_var_types=use_large_var_types):
+ with self.sql_conf(
+ {"spark.sql.execution.arrow.useLargeVarTypes": use_large_var_types}
+ ):
+
+ @udtf(returnType="a: string")
+ class TestUDTF:
+ def eval(self, a: int):
+ yield str(a)
+
+ assertDataFrameEqual(TestUDTF(lit(1)), [Row(a="1")])
+
def test_numeric_output_type_casting(self):
class TestUDTF:
def eval(self):
@@ -3158,23 +3389,6 @@ def tearDownClass(cls):
class UDTFArrowTestsMixin(LegacyUDTFArrowTestsMixin):
- def test_udtf_eval_returning_non_tuple(self):
- @udtf(returnType="a: int")
- class TestUDTF:
- def eval(self, a: int):
- yield a
-
- with self.assertRaisesRegex(PythonException, "UDTF_ARROW_TYPE_CONVERSION_ERROR"):
- TestUDTF(lit(1)).collect()
-
- @udtf(returnType="a: int")
- class TestUDTF:
- def eval(self, a: int):
- return [a]
-
- with self.assertRaisesRegex(PythonException, "UDTF_ARROW_TYPE_CONVERSION_ERROR"):
- TestUDTF(lit(1)).collect()
-
def test_numeric_output_type_casting(self):
class TestUDTF:
def eval(self):
diff --git a/python/pyspark/sql/tests/udf_type_tests/README.md b/python/pyspark/sql/tests/udf_type_tests/README.md
new file mode 100644
index 0000000000000..74d1933c49519
--- /dev/null
+++ b/python/pyspark/sql/tests/udf_type_tests/README.md
@@ -0,0 +1,13 @@
+These tests capture the input/output type interfaces between Python UDFs and the engine. This is internal documentation, not user-facing documentation. Please consider the type behavior "experimental" unless we specify otherwise; parts of the type handling might change in the future.
+
+# Return type tests
+These generate tables with the returned 'Python Value' and the 'SQL Type' output type of the UDF. The 'SQL Type' fields are DDL-formatted strings, which can be used as `returnType`s.
+- Note: The values inside the table are generated by `repr`. 'X' means the conversion throws an exception.
+- Note: Python 3.11.9, Pandas 2.2.3, and PyArrow 17.0.0 are used.
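+
+For illustration, a DDL string like those in the 'SQL Type' column can be passed directly as a UDF `returnType`. The sketch below is hypothetical (not taken from the golden files) and assumes an active `spark` session:
+
+```python
+from pyspark.sql.functions import udf
+
+# DDL-formatted return type, in the same format as the 'SQL Type' column.
+@udf(returnType="array<int>")
+def to_pair(x):
+    return [x, x + 1]
+
+spark.range(3).select(to_pair("id")).show()
+```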
+
+# Input type tests
+These generate tables with 'Spark Type' and 'Spark Value', representing the engine-side input data. The UDF input data is captured in the 'Python Type' and 'Python Value' columns.
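+
+As a hypothetical probe (not part of the golden files), the Python-side type can also be observed from inside a UDF, assuming an active `spark` session:
+
+```python
+import pandas as pd
+
+from pyspark.sql.functions import pandas_udf
+
+@pandas_udf("string")
+def dtype_of(s: pd.Series) -> pd.Series:
+    # Report the pandas dtype that the engine hands to the UDF.
+    return pd.Series([str(s.dtype)] * len(s))
+
+spark.range(1).select(dtype_of("id")).show()  # a bigint column arrives as int64
+```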
+
+# When this test fails:
+- Look at the diff in the test output.
+- To regenerate a golden file, delete the existing golden file and re-run the test.
\ No newline at end of file
diff --git a/python/pyspark/sql/tests/udf_type_tests/__init__.py b/python/pyspark/sql/tests/udf_type_tests/__init__.py
new file mode 100644
index 0000000000000..cce3acad34a49
--- /dev/null
+++ b/python/pyspark/sql/tests/udf_type_tests/__init__.py
@@ -0,0 +1,16 @@
+#
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
diff --git a/python/pyspark/sql/tests/udf_type_tests/golden_pandas_udf_input_types.txt b/python/pyspark/sql/tests/udf_type_tests/golden_pandas_udf_input_types.txt
new file mode 100644
index 0000000000000..d21e7f2eb24a1
--- /dev/null
+++ b/python/pyspark/sql/tests/udf_type_tests/golden_pandas_udf_input_types.txt
@@ -0,0 +1,43 @@
++--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+
+|Test Case |Spark Type |Spark Value |Python Type |Python Value |
++--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+--------------------------------------------------------------------------------------+
+|byte_values |tinyint |[-128, 127, 0] |['int8', 'int8', 'int8'] |[-128, 127, 0] |
+|byte_null |tinyint |[None, 42] |['float64', 'float64'] |[None, 42] |
+|short_values |smallint |[-32768, 32767, 0] |['int16', 'int16', 'int16'] |[-32768, 32767, 0] |
+|short_null |smallint |[None, 123] |['float64', 'float64'] |[None, 123] |
+|int_values |int |[-2147483648, 2147483647, 0] |['int32', 'int32', 'int32'] |[-2147483648, 2147483647, 0] |
+|int_null |int |[None, 456] |['float64', 'float64'] |[None, 456] |
+|long_values |bigint |[-9223372036854775808, 9223372036854775807, 0] |['int64', 'int64', 'int64'] |[-9223372036854775808, 9223372036854775807, 0] |
+|long_null |bigint |[None, 789] |['float64', 'float64'] |[None, 789] |
+|float_values |float |[0.0, 1.0, 3.140000104904175] |['float32', 'float32', 'float32'] |[0.0, 1.0, 3.140000104904175] |
+|float_null |float |[None, 3.140000104904175] |['float32', 'float32'] |[None, 3.140000104904175] |
+|double_values |double |[0.0, 1.0, 0.3333333333333333] |['float64', 'float64', 'float64'] |[0.0, 1.0, 0.3333333333333333] |
+|double_null |double |[None, 2.71] |['float64', 'float64'] |[None, 2.71] |
+|decimal_values |decimal(3,2) |[Decimal('5.35'), Decimal('1.23')] |['object', 'object'] |[Decimal('5.35'), Decimal('1.23')] |
+|decimal_null |decimal(3,2) |[None, Decimal('9.99')] |['object', 'object'] |[None, Decimal('9.99')] |
+|string_values |string |['abc', '', 'hello'] |['object', 'object', 'object'] |['abc', '', 'hello'] |
+|string_null |string |[None, 'test'] |['object', 'object'] |[None, 'test'] |
+|binary_values |binary |[bytearray(b'abc'), bytearray(b''), bytearray(b'ABC')] |['object', 'object', 'object'] |[bytearray(b'abc'), bytearray(b''), bytearray(b'ABC')] |
+|binary_null |binary |[None, bytearray(b'test')] |['object', 'object'] |[None, bytearray(b'test')] |
+|boolean_values |boolean |[True, False] |['bool', 'bool'] |[True, False] |
+|boolean_null |boolean |[None, True] |['object', 'object'] |[None, True] |
+|date_values |date |[datetime.date(2020, 2, 2), datetime.date(1970, 1, 1)] |['object', 'object'] |[datetime.date(2020, 2, 2), datetime.date(1970, 1, 1)] |
+|date_null |date |[None, datetime.date(2023, 1, 1)] |['object', 'object'] |[None, datetime.date(2023, 1, 1)] |
+|timestamp_values |timestamp |[datetime.datetime(2020, 2, 2, 12, 15, 16, 123000)] |['datetime64[ns]'] |[datetime.datetime(2020, 2, 2, 12, 15, 16, 123000)] |
+|timestamp_null |timestamp |[None, datetime.datetime(2023, 1, 1, 12, 0)] |['datetime64[ns]', 'datetime64[ns]'] |[None, datetime.datetime(2023, 1, 1, 12, 0)] |
+|array_int_values |array |[[1, 2, 3], [], [1, None, 3]] |['object', 'object', 'object'] |[[1, 2, 3], [], [1, None, 3]] |
+|array_int_null |array |[None, [4, 5, 6]] |['object', 'object'] |[None, [4, 5, 6]] |
+|map_str_int_values |map |[{'world': 2, 'hello': 1}, {}] |['object', 'object'] |[{'world': 2, 'hello': 1}, {}] |
+|map_str_int_null |map |[None, {'test': 123}] |['object', 'object'] |[None, {'test': 123}] |
+|struct_int_str_values |struct |[Row(a1=1, a2='hello'), Row(a1=2, a2='world')] |['DataFrame', 'DataFrame'] |[Row(a1=1, a2='hello'), Row(a1=2, a2='world')] |
+|struct_int_str_null |struct |[None, Row(a1=99, a2='test')] |['DataFrame', 'DataFrame'] |[Row(a1=None, a2=None), Row(a1=99, a2='test')] |
+|array_array_int |array> |[[[1, 2, 3]], [[1], [2, 3]]] |['object', 'object'] |[[[1, 2, 3]], [[1], [2, 3]]] |
+|array_map_str_int |array
|""".stripMargin
- Files.asCharSink(new File(customConf, "core-site.xml"), StandardCharsets.UTF_8).write(coreSite)
+ Files.writeString(new File(customConf, "core-site.xml").toPath, coreSite)
val result = File.createTempFile("result", null, tempDir)
val finalState = runSpark(false,
@@ -353,7 +352,7 @@ class YarnClusterSuite extends BaseYarnClusterSuite {
test("running Spark in yarn-cluster mode displays driver log links") {
val log4jConf = new File(tempDir, "log4j2.properties")
val logOutFile = new File(tempDir, "logs")
- Files.asCharSink(log4jConf, StandardCharsets.UTF_8).write(
+ Files.writeString(log4jConf.toPath,
s"""rootLogger.level = debug
|rootLogger.appenderRef.file.ref = file
|appender.file.type = File
@@ -367,8 +366,7 @@ class YarnClusterSuite extends BaseYarnClusterSuite {
val confDir = new File(tempDir, "conf")
confDir.mkdir()
val javaOptsFile = new File(confDir, "java-opts")
- Files.asCharSink(javaOptsFile, StandardCharsets.UTF_8)
- .write(s"-Dlog4j.configurationFile=file://$log4jConf\n")
+ Files.writeString(javaOptsFile.toPath, s"-Dlog4j.configurationFile=file://$log4jConf\n")
val result = File.createTempFile("result", null, tempDir)
val finalState = runSpark(clientMode = false,
@@ -377,7 +375,7 @@ class YarnClusterSuite extends BaseYarnClusterSuite {
extraEnv = Map("SPARK_CONF_DIR" -> confDir.getAbsolutePath),
extraConf = Map(CLIENT_INCLUDE_DRIVER_LOGS_LINK.key -> true.toString))
checkResult(finalState, result)
- val logOutput = Files.asCharSource(logOutFile, StandardCharsets.UTF_8).read()
+ val logOutput = Files.readString(logOutFile.toPath)
val logFilePattern = raw"""(?s).+\sDriver Logs \(\): https?://.+/(\?\S+)?\s.+"""
logOutput should fullyMatch regex logFilePattern.replace("", "stdout")
logOutput should fullyMatch regex logFilePattern.replace("", "stderr")
@@ -432,7 +430,7 @@ class YarnClusterSuite extends BaseYarnClusterSuite {
script: String = TEST_PYFILE): Unit = {
assume(isPythonAvailable)
val primaryPyFile = new File(tempDir, "test.py")
- Files.asCharSink(primaryPyFile, StandardCharsets.UTF_8).write(script)
+ Files.writeString(primaryPyFile.toPath, script)
// When running tests, let's not assume the user has built the assembly module, which also
// creates the pyspark archive. Instead, let's use PYSPARK_ARCHIVES_PATH to point at the
@@ -460,7 +458,7 @@ class YarnClusterSuite extends BaseYarnClusterSuite {
subdir
}
val pyModule = new File(moduleDir, "mod1.py")
- Files.asCharSink(pyModule, StandardCharsets.UTF_8).write(TEST_PYMODULE)
+ Files.writeString(pyModule.toPath, TEST_PYMODULE)
val mod2Archive = TestUtils.createJarWithFiles(Map("mod2.py" -> TEST_PYMODULE), moduleDir)
val pyFiles = Seq(pyModule.getAbsolutePath(), mod2Archive.getPath()).mkString(",")
@@ -507,7 +505,7 @@ class YarnClusterSuite extends BaseYarnClusterSuite {
def createEmptyIvySettingsFile: File = {
val emptyIvySettings = File.createTempFile("ivy", ".xml")
- Files.asCharSink(emptyIvySettings, StandardCharsets.UTF_8).write("")
+ Files.writeString(emptyIvySettings.toPath, "")
emptyIvySettings
}
@@ -619,7 +617,7 @@ private object YarnClusterDriverUseSparkHadoopUtilConf extends Logging with Matc
}
result = "success"
} finally {
- Files.asCharSink(status, StandardCharsets.UTF_8).write(result)
+ Files.writeString(status.toPath, result)
sc.stop()
}
}
@@ -722,7 +720,7 @@ private object YarnClusterDriver extends Logging with Matchers {
assert(driverAttributes === expectationAttributes)
}
} finally {
- Files.asCharSink(status, StandardCharsets.UTF_8).write(result)
+ Files.writeString(status.toPath, result)
sc.stop()
}
}
@@ -764,14 +762,13 @@ private object YarnClasspathTest extends Logging {
var result = "failure"
try {
val ccl = Thread.currentThread().getContextClassLoader()
- val resource = ccl.getResourceAsStream("test.resource")
- val bytes = ByteStreams.toByteArray(resource)
+ val bytes = ccl.getResourceAsStream("test.resource").readAllBytes()
result = new String(bytes, 0, bytes.length, StandardCharsets.UTF_8)
} catch {
case t: Throwable =>
error(s"loading test.resource to $resultPath", t)
} finally {
- Files.asCharSink(new File(resultPath), StandardCharsets.UTF_8).write(result)
+ Files.writeString(new File(resultPath).toPath, result)
}
}
@@ -815,7 +812,7 @@ private object YarnAddJarTest extends Logging {
result = "success"
}
} finally {
- Files.asCharSink(new File(resultPath), StandardCharsets.UTF_8).write(result)
+ Files.writeString(new File(resultPath).toPath, result)
sc.stop()
}
}
@@ -860,7 +857,7 @@ private object ExecutorEnvTestApp {
executorEnvs.get(k).contains(v)
}
- Files.asCharSink(new File(status), StandardCharsets.UTF_8).write(result.toString)
+ Files.writeString(new File(status).toPath, result.toString)
sc.stop()
}
@@ -875,7 +872,7 @@ private class PyConnectDepChecker(python: String, libPath: Seq[String]) {
lazy val isSparkConnectJarAvailable: Boolean = {
val filePath = s"$sparkHome/assembly/target/$scalaDir/jars/" +
s"spark-connect_$scalaVersion-$SPARK_VERSION.jar"
- java.nio.file.Files.exists(Paths.get(filePath))
+ Files.exists(Paths.get(filePath))
}
lazy val isConnectPythonPackagesAvailable: Boolean = Try {
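
Editor's note: the hunks above replace Guava's `Files.asCharSink`/`asCharSource` with `java.nio.file.Files`. For reference, a minimal standalone sketch of the migration pattern (not Spark code): `Files.writeString`/`Files.readString` exist since Java 11 and default to UTF-8, so the explicit `StandardCharsets.UTF_8` argument disappears.

```scala
import java.io.File
import java.nio.file.Files

// Guava: Files.asCharSink(file, StandardCharsets.UTF_8).write(text)
// NIO:   Files.writeString(file.toPath, text)   // UTF-8 by default since Java 11
// Guava: Files.asCharSource(file, StandardCharsets.UTF_8).read()
// NIO:   Files.readString(file.toPath)
val file = File.createTempFile("example", ".txt")
Files.writeString(file.toPath, "hello")
assert(Files.readString(file.toPath) == "hello")
```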
diff --git a/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnShuffleIntegrationSuite.scala b/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnShuffleIntegrationSuite.scala
index f8d69c0ae568e..2c567b3fa243d 100644
--- a/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnShuffleIntegrationSuite.scala
+++ b/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnShuffleIntegrationSuite.scala
@@ -18,10 +18,8 @@
package org.apache.spark.deploy.yarn
import java.io.File
-import java.nio.charset.StandardCharsets
+import java.nio.file.Files
-import com.google.common.io.Files
-import org.apache.commons.io.FileUtils
import org.apache.hadoop.yarn.conf.YarnConfiguration
import org.scalatest.matchers.must.Matchers
import org.scalatest.matchers.should.Matchers._
@@ -34,6 +32,7 @@ import org.apache.spark.network.shuffle.ShuffleTestAccessor
import org.apache.spark.network.shuffledb.DBBackend
import org.apache.spark.network.yarn.{YarnShuffleService, YarnTestAccessor}
import org.apache.spark.tags.{ExtendedLevelDBTest, ExtendedYarnTest}
+import org.apache.spark.util.Utils
/**
* Integration test for the external shuffle service with a yarn mini-cluster
@@ -172,16 +171,16 @@ private object YarnExternalShuffleDriver extends Logging with Matchers {
val dbBackend = DBBackend.byName(dbBackendName)
logWarning(s"Use ${dbBackend.name()} as the implementation of " +
s"${SHUFFLE_SERVICE_DB_BACKEND.key}")
- FileUtils.copyDirectory(registeredExecFile, execStateCopy)
+ Utils.copyDirectory(registeredExecFile, execStateCopy)
assert(!ShuffleTestAccessor
.reloadRegisteredExecutors(dbBackend, execStateCopy).isEmpty)
}
} finally {
sc.stop()
if (execStateCopy != null) {
- FileUtils.deleteDirectory(execStateCopy)
+ Utils.deleteRecursively(execStateCopy)
}
- Files.asCharSink(status, StandardCharsets.UTF_8).write(result)
+ Files.writeString(status.toPath, result)
}
}
diff --git a/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtilSuite.scala b/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtilSuite.scala
index 562ce3b5bdbaf..a6b9caae8d369 100644
--- a/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtilSuite.scala
+++ b/resource-managers/yarn/src/test/scala/org/apache/spark/deploy/yarn/YarnSparkHadoopUtilSuite.scala
@@ -18,9 +18,8 @@
package org.apache.spark.deploy.yarn
import java.io.{File, IOException}
-import java.nio.charset.StandardCharsets
+import java.nio.file.Files
-import com.google.common.io.{ByteStreams, Files}
import org.apache.hadoop.yarn.api.records.ApplicationAccessType
import org.apache.hadoop.yarn.conf.YarnConfiguration
import org.scalatest.matchers.must.Matchers
@@ -54,12 +53,12 @@ class YarnSparkHadoopUtilSuite extends SparkFunSuite with Matchers with ResetSys
val args = Array("arg1", "${arg.2}", "\"arg3\"", "'arg4'", "$arg5", "\\arg6")
try {
val argLine = args.map(a => YarnSparkHadoopUtil.escapeForShell(a)).mkString(" ")
- Files.write(("bash -c \"echo " + argLine + "\"").getBytes(StandardCharsets.UTF_8), scriptFile)
+ Files.writeString(scriptFile.toPath, "bash -c \"echo " + argLine + "\"")
scriptFile.setExecutable(true)
val proc = Runtime.getRuntime().exec(Array(scriptFile.getAbsolutePath()))
- val out = new String(ByteStreams.toByteArray(proc.getInputStream())).trim()
- val err = new String(ByteStreams.toByteArray(proc.getErrorStream()))
+ val out = Utils.toString(proc.getInputStream()).trim()
+ val err = Utils.toString(proc.getErrorStream())
val exitCode = proc.waitFor()
exitCode should be (0)
out should be (args.mkString(" "))
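
Editor's note: the hunk above drains process streams with Spark's `Utils.toString` instead of Guava's `ByteStreams.toByteArray`. A minimal sketch of that replacement, under the assumption that it is compiled inside Spark itself (`org.apache.spark.util.Utils` is `private[spark]`); the example object name is made up.

```scala
package org.apache.spark.example

import org.apache.spark.util.Utils

object DrainProcessOutput {
  def main(args: Array[String]): Unit = {
    // Utils.toString reads an InputStream fully into a String, as used in the test above.
    val proc = Runtime.getRuntime.exec(Array("/bin/echo", "hello"))
    val out = Utils.toString(proc.getInputStream).trim
    assert(proc.waitFor() == 0 && out == "hello")
  }
}
```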
diff --git a/resource-managers/yarn/src/test/scala/org/apache/spark/network/yarn/YarnShuffleServiceSuite.scala b/resource-managers/yarn/src/test/scala/org/apache/spark/network/yarn/YarnShuffleServiceSuite.scala
index 56d7b7ff6a09e..72d684e15fc62 100644
--- a/resource-managers/yarn/src/test/scala/org/apache/spark/network/yarn/YarnShuffleServiceSuite.scala
+++ b/resource-managers/yarn/src/test/scala/org/apache/spark/network/yarn/YarnShuffleServiceSuite.scala
@@ -129,12 +129,12 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
reduceId: Int,
blockId: String): AppShufflePartitionInfo = {
val dataFile = ShuffleTestAccessor.getMergedShuffleDataFile(mergeManager, partitionId, reduceId)
- dataFile.getParentFile.mkdirs()
+ Utils.createDirectory(dataFile.getParentFile)
val indexFile =
ShuffleTestAccessor.getMergedShuffleIndexFile(mergeManager, partitionId, reduceId)
- indexFile.getParentFile.mkdirs()
+ Utils.createDirectory(indexFile.getParentFile)
val metaFile = ShuffleTestAccessor.getMergedShuffleMetaFile(mergeManager, partitionId, reduceId)
- metaFile.getParentFile.mkdirs()
+ Utils.createDirectory(metaFile.getParentFile)
val partitionInfo = ShuffleTestAccessor.getOrCreateAppShufflePartitionInfo(
mergeManager, partitionId, reduceId, blockId)
@@ -616,35 +616,35 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
val mergeManager1DB = ShuffleTestAccessor.mergeManagerDB(mergeManager1)
ShuffleTestAccessor.recoveryFile(mergeManager1) should be (mergeMgrFile)
- ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1).size() equals 0
- ShuffleTestAccessor.reloadAppShuffleInfo(
- mergeManager1, mergeManager1DB).size() equals 0
+ assert(ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1).size() equals 0)
+ assert(ShuffleTestAccessor.reloadAppShuffleInfo(
+ mergeManager1, mergeManager1DB).size() equals 0)
mergeManager1.registerExecutor(app1Id.toString, mergedShuffleInfo1)
var appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
var appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 1
+ assert(appShuffleInfoAfterReload.size() equals 1)
appShuffleInfoAfterReload.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
mergeManager1.registerExecutor(app2Attempt1Id.toString, mergedShuffleInfo2Attempt1)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 2
+ assert(appShuffleInfo.size() equals 2)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfo.get(
app2Attempt1Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 2
+ assert(appShuffleInfoAfterReload.size() equals 2)
appShuffleInfoAfterReload.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfoAfterReload.get(
app2Attempt1Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
mergeManager1.registerExecutor(app3IdNoAttemptId.toString, mergedShuffleInfo3NoAttemptId)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 3
+ assert(appShuffleInfo.size() equals 3)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfo.get(
app2Attempt1Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
@@ -652,7 +652,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
app3IdNoAttemptId.toString).getAppPathsInfo should be (appPathsInfo3NoAttempt)
appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 3
+ assert(appShuffleInfoAfterReload.size() equals 3)
appShuffleInfoAfterReload.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfoAfterReload.get(
app2Attempt1Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
@@ -661,7 +661,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
mergeManager1.registerExecutor(app2Attempt2Id.toString, mergedShuffleInfo2Attempt2)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 3
+ assert(appShuffleInfo.size() equals 3)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfo.get(
app2Attempt2Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt2)
@@ -669,7 +669,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
app3IdNoAttemptId.toString).getAppPathsInfo should be (appPathsInfo3NoAttempt)
appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 3
+ assert(appShuffleInfoAfterReload.size() equals 3)
appShuffleInfoAfterReload.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfoAfterReload.get(
app2Attempt2Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt2)
@@ -678,14 +678,14 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
mergeManager1.applicationRemoved(app2Attempt2Id.toString, true)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 2
+ assert(appShuffleInfo.size() equals 2)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
assert(!appShuffleInfo.containsKey(app2Attempt2Id.toString))
appShuffleInfo.get(
app3IdNoAttemptId.toString).getAppPathsInfo should be (appPathsInfo3NoAttempt)
appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 2
+ assert(appShuffleInfoAfterReload.size() equals 2)
appShuffleInfoAfterReload.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
assert(!appShuffleInfoAfterReload.containsKey(app2Attempt2Id.toString))
appShuffleInfoAfterReload.get(
@@ -725,9 +725,9 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
val mergeManager1DB = ShuffleTestAccessor.mergeManagerDB(mergeManager1)
ShuffleTestAccessor.recoveryFile(mergeManager1) should be (mergeMgrFile)
- ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1).size() equals 0
- ShuffleTestAccessor.reloadAppShuffleInfo(
- mergeManager1, mergeManager1DB).size() equals 0
+ assert(ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1).size() equals 0)
+ assert(ShuffleTestAccessor.reloadAppShuffleInfo(
+ mergeManager1, mergeManager1DB).size() equals 0)
mergeManager1.registerExecutor(app1Id.toString, mergedShuffleInfo1)
mergeManager1.registerExecutor(app2Attempt1Id.toString, mergedShuffleInfo2Attempt1)
@@ -737,7 +737,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
prepareAppShufflePartition(mergeManager1, partitionId2, 2, "4")
var appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 2
+ assert(appShuffleInfo.size() equals 2)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfo.get(
app2Attempt1Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
@@ -745,7 +745,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
assert(!appShuffleInfo.get(app2Attempt1Id.toString).getShuffles.get(2).isFinalized)
var appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 2
+ assert(appShuffleInfoAfterReload.size() equals 2)
appShuffleInfoAfterReload.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfoAfterReload.get(
app2Attempt1Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
@@ -765,12 +765,12 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
mergeManager1.applicationRemoved(app1Id.toString, true)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
assert(!appShuffleInfo.containsKey(app1Id.toString))
assert(appShuffleInfo.get(app2Attempt1Id.toString).getShuffles.get(2).isFinalized)
appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 1
+ assert(appShuffleInfoAfterReload.size() equals 1)
assert(!appShuffleInfoAfterReload.containsKey(app1Id.toString))
assert(appShuffleInfoAfterReload.get(app2Attempt1Id.toString).getShuffles.get(2).isFinalized)
@@ -844,7 +844,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
prepareAppShufflePartition(mergeManager1, partitionId2, 2, "4")
var appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 2
+ assert(appShuffleInfo.size() equals 2)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
appShuffleInfo.get(
app2Id.toString).getAppPathsInfo should be (appPathsInfo2Attempt1)
@@ -867,20 +867,20 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
mergeManager1.applicationRemoved(app1Id.toString, true)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
assert(!appShuffleInfo.containsKey(app1Id.toString))
assert(appShuffleInfo.get(app2Id.toString).getShuffles.get(2).isFinalized)
// Clear the AppsShuffleInfo hashmap and reload the hashmap from DB
appShuffleInfoAfterReload =
ShuffleTestAccessor.reloadAppShuffleInfo(mergeManager1, mergeManager1DB)
- appShuffleInfoAfterReload.size() equals 1
+ assert(appShuffleInfoAfterReload.size() equals 1)
assert(!appShuffleInfoAfterReload.containsKey(app1Id.toString))
assert(appShuffleInfoAfterReload.get(app2Id.toString).getShuffles.get(2).isFinalized)
// Register application app1Id again and reload the DB again
mergeManager1.registerExecutor(app1Id.toString, mergedShuffleInfo1)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 2
+ assert(appShuffleInfo.size() equals 2)
appShuffleInfo.get(app1Id.toString).getAppPathsInfo should be (appPathsInfo1)
assert(appShuffleInfo.get(app1Id.toString).getShuffles.isEmpty)
assert(appShuffleInfo.get(app2Id.toString).getShuffles.get(2).isFinalized)
@@ -924,7 +924,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
prepareAppShufflePartition(mergeManager1, partitionId1, 2, "4")
var appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
appShuffleInfo.get(
app1Id.toString).getAppPathsInfo should be (appPathsInfo1Attempt1)
assert(!appShuffleInfo.get(app1Id.toString).getShuffles.get(2).isFinalized)
@@ -938,7 +938,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
prepareAppShufflePartition(mergeManager1, partitionId2, 2, "4")
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
appShuffleInfo.get(
app1Id.toString).getAppPathsInfo should be (appPathsInfo1Attempt2)
assert(!appShuffleInfo.get(app1Id.toString).getShuffles.get(2).isFinalized)
@@ -973,7 +973,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
val mergeManager3 = s3.shuffleMergeManager.asInstanceOf[RemoteBlockPushResolver]
val mergeManager3DB = ShuffleTestAccessor.mergeManagerDB(mergeManager3)
appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager3)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
appShuffleInfo.get(
app1Id.toString).getAppPathsInfo should be (appPathsInfo1Attempt2)
assert(appShuffleInfo.get(app1Id.toString).getShuffles.get(2).isFinalized)
@@ -1014,7 +1014,7 @@ abstract class YarnShuffleServiceSuite extends SparkFunSuite with Matchers {
mergeManager1.registerExecutor(app1Id.toString, mergedShuffleInfo1Attempt2)
val appShuffleInfo = ShuffleTestAccessor.getAppsShuffleInfo(mergeManager1)
- appShuffleInfo.size() equals 1
+ assert(appShuffleInfo.size() equals 1)
appShuffleInfo.get(
app1Id.toString).getAppPathsInfo should be (appPathsInfo1Attempt2)
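
Editor's note: the `assert(...)` wrappers added above fix checks that previously could never fail. In Scala, a bare `x.size() equals n` is just a discarded Boolean expression. A minimal, self-contained sketch of the difference (plain ScalaTest, not the Spark suite):

```scala
import org.scalatest.funsuite.AnyFunSuite

class EqualsIsNotAnAssertionSuite extends AnyFunSuite {
  test("a bare `equals` expression never fails the test") {
    val xs = Seq(1, 2, 3)
    xs.size equals 2          // evaluates to false, but the result is silently discarded
    assert(xs.size equals 3)  // wrapping in assert makes the comparison an actual check
  }
}
```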
diff --git a/scalastyle-config.xml b/scalastyle-config.xml
index ca3d507ed3a44..f9b260e14c6f9 100644
--- a/scalastyle-config.xml
+++ b/scalastyle-config.xml
@@ -46,7 +46,7 @@ This file is divided into 3 sections:
-
+
+
+ \bFiles\.createParentDirs\b
+ Use createParentDirs of SparkFileUtils or Utils instead.
+
+
+
+ \bFiles\.equal\b
+ Use contentEquals of SparkFileUtils or Utils instead.
+
+
+
+ \bFiles\.toByteArray\b
+ Use java.nio.file.Files.readAllBytes instead.
+
+
+
+ \bFiles\.asByteSource\b
+ Use java.nio.file.Files.newInputStream instead.
+
+
+
+ \bFileUtils\.getTempDirectory\b
+ Use System.getProperty instead.
+
+
+
+ \bFileUtils\.readLines\b
+ Use Files.readAllLines instead.
+
+
+
+ \bFiles\.readLines\b
+ Use Files.readAllLines instead.
+
+
+
+ \bFileUtils\.readFileToString\b
+ Use Files.readString instead.
+
+
+
+ \bFiles\.asCharSource\b
+ Use Files.readString instead.
+
+
+
+ \bFileUtils\.write\b
+ Use Files.writeString instead.
+
+
+
+ \bFiles\.asCharSink\b
+ Use Files.writeString instead.
+
+
+
+ \bFileUtils\.writeLines\b
+ Use Files.write instead.
+
+
+
+ \bFileUtils\.cleanDirectory\b
+ Use cleanDirectory of JavaUtils/SparkFileUtils/Utils
+
+
+
+ \bFileUtils\.deleteDirectory\b
+ Use deleteRecursively of JavaUtils/SparkFileUtils/Utils
+
+
+
+ \bFileUtils\.forceDelete\b
+ Use deleteRecursively of JavaUtils/SparkFileUtils/Utils
+
+
+
+ \bFileUtils\.forceDeleteOnExit\b
+ Use forceDeleteOnExit of JavaUtils/SparkFileUtils/Utils instead.
+
+
+
+ \bFileUtils\.deleteQuietly\b
+ Use deleteQuietly of JavaUtils/SparkFileUtils/Utils
+
+
+
+ \bFileUtils\.readFileToByteArray\b
+ Use java.nio.file.Files.readAllBytes
+
+
+
+ \bFileUtils\.sizeOf(Directory)?\b
+ Use sizeOf of JavaUtils or Utils instead.
+
+
+
+ \bFileUtils\.moveFile\b
+ Use copyFile of JavaUtils/SparkFileUtils/Utils instead.
+
+
+
+ \bFileUtils\.copyURLToFile\b
+ Use copyURLToFile of JavaUtils instead.
+
+
+
+ \bFileUtils\.copyFile\b
+ Use copyFile of SparkFileUtils or Utils instead.
+
+
+
+ \bFileUtils\.copyFileToDirectory\b
+ Use copyFileToDirectory of SparkFileUtils or Utils instead.
+
+
+
+ \bFileUtils\.copyDirectory\b
+ Use copyDirectory of JavaUtils/SparkFileUtils/Utils instead.
+
+
+
+ \bFileUtils\.moveDirectory\b
+ Use copyDirectory of SparkFileUtils or Utils instead.
+
+
+
+ \bFileUtils\.contentEquals\b
+ Use contentEquals of SparkFileUtils or Utils instead.
+
+
org\.apache\.commons\.lang\.Use Commons Lang 3 classes (package org.apache.commons.lang3.*) instead
of Commons Lang 2 (package org.apache.commons.lang.*)
+
+ \bFileUtils\.getFile\b
+ Use getFile of SparkFileUtil or Utils instead.
+
+
+
+ \bFileUtils\.touch\b
+ Use touch of SparkFileUtil or Utils instead.
+
+
+
+ \bFiles\.touch\b
+ Use touch of SparkFileUtil or Utils instead.
+
+
+
+ \bFileUtils\.writeStringToFile\b
+ Use java.nio.file.Files.writeString instead.
+
+
+
+ \bFileUtils\.listFiles\b
+ Use listFiles of SparkFileUtil or Utils instead.
+
+
+
+ org\.apache\.commons\.codec\.binary\.Base64\b
+ Use java.util.Base64 instead
+
+
+
+ org\.apache\.commons\.lang3\..*JavaVersion
+ Use JEP 223 API (java.lang.Runtime.Version) instead of
+ Commons Lang 3 JavaVersion (org.apache.commons.lang3.JavaVersion)
+
+
+
+ org\.apache\.commons\.lang3\.tuple
+ Use org.apache.spark.util.Pair instead
+
+
+
+ org\.apache\.commons\.lang3\.builder\.ToStringBuilder
+ Use String concatenation instead
+
+
+
+ \bStringUtils\.(left|right)Pad\b
+ Use (left|right)Pad of SparkStringUtils or Utils instead
+
+
+
+ \bStringUtils\.split\b
+ Use Utils.stringToSeq instead
+
+
+
+ \bStringUtils\.is(Not)?(Blank|Empty)\b
+ Use Utils.is(Not)?(Blank|Empty) instead
+
+
+
+ \bExceptionUtils\.getRootCause\b
+ Use getRootCause of SparkErrorUtils or Utils instead
+
+
+
+ \bExceptionUtils\.getStackTrace\b
+ Use stackTraceToString of JavaUtils/SparkFileUtils/Utils instead.
+
+
+
+ org\.apache\.commons\.lang3\.Strings\b
+ Use Java String methods instead
+
+
+
+ \bStringUtils\.strip\b
+ Use Utils.strip method instead
+
+
+
+ \bHex\.encodeHexString\b
+ Use java.util.HexFormat instead
+
+
+
+ org\.apache\.commons\.io\.FileUtils\b
+ Use Java API or Spark's JavaUtils/SparkSystemUtils/Utils instead
+
+
+
+ org\.apache\.commons\.lang3\.StringUtils\b
+ Use Java String or Spark's Utils/JavaUtils methods instead
+
+
+
+ org\.apache\.commons\.lang3\.SystemUtils\b
+ Use SparkSystemUtils or Utils instead
+
+
+
+ org\.apache\.commons\.text\.StringSubstitutor\b
+ Use org.apache.spark.StringSubstitutor instead
+
+
+
+ \bStringUtils\.abbreviate\b
+ Use Utils.abbreviate method instead
+
+
+
+ \bStringUtils\.substring\b
+ Use Java String.substring instead.
+
+
- UriBuilder\.fromUri
+ \bUriBuilder\.fromUri\b
+ Use Utils.getUriBuilder instead.
@@ -300,7 +546,7 @@ This file is divided into 3 sections:
- FileSystem.get\([a-zA-Z_$][a-zA-Z_$0-9]*\)
+ \bFileSystem\.get\([a-zA-Z_$][a-zA-Z_$0-9]*\)
- byteCountToDisplaySize
+ \bbyteCountToDisplaySize\b
+ Use Utils.bytesToString instead of byteCountToDisplaySize for consistency.
@@ -470,4 +716,124 @@ This file is divided into 3 sections:
buildConf\("spark.databricks.Use Apache Spark config namespace.
+
+
+ com\.google\.common\.base\.Strings\b
+ Use Java built-in methods or SparkStringUtils instead
+
+
+
+ org\.apache\.hadoop\.io\.IOUtils\b
+ Use org.apache.spark.util.Utils instead.
+
+
+
+ Charset\.defaultCharset
+ Use StandardCharsets.UTF_8 instead.
+
+
+
+ \bIOUtils\.toByteArray\b
+ Use Java readAllBytes instead.
+
+
+
+ \bIOUtils\.closeQuietly\b
+ Use closeQuietly of SparkErrorUtils or Utils instead.
+
+
+
+ \bIOUtils\.copy\b
+ Use Java transferTo instead.
+
+
+
+ \bIOUtils\.toString\b
+ Use toString of SparkStreamUtils or Utils instead.
+
+
+
+ \bCharStreams\.toString\b
+ Use toString of SparkStreamUtils or Utils instead.
+
+
+
+ \bIOUtils\.write\b
+ Use Java `write` instead.
+
+
+
+ \bByteStreams\.read\b
+ Use Java readNBytes instead.
+
+
+
+ \bByteStreams\.copy\b
+ Use Java transferTo instead.
+
+
+
+ \bByteStreams\.skipFully\b
+ Use Java `skipNBytes` instead.
+
+
+
+ \bByteStreams\.readFully\b
+ Use readFully of JavaUtils/SparkStreamUtils/Utils instead.
+
+
+
+ \bByteStreams\.nullOutputStream\b
+ Use OutputStream.nullOutputStream instead.
+
+
+
+ \bImmutableMap\.copyOf\b
+ Use Map.copyOf instead.
+
+
+
+ \bImmutableSet\.of\b
+ Use java.util.Set.of instead.
+
+
+
+ org\.apache\.commons\.collections4\.MapUtils\b
+ Use org.apache.spark.util.collection.Utils instead.
+
+
+
+ com\.google\.common\.io\.Files\b
+ Use Java API or Spark's JavaUtils/SparkFileUtils/Utils instead.
+
+
+
+ com\.google\.common\.base\.Objects\b
+ Use Java APIs (like java.util.Objects) instead.
+
+
+
+ com\.google\.common\.base\.Joiner\b
+ Use Java APIs (like String.join/StringJoiner) instead.
+
+
+
+ com\.google\.common\.io\.BaseEncoding\b
+ Use Java APIs (like java.util.Base64) instead.
+
+
+
+ \bThrowables\.getStackTraceAsString\b
+ Use stackTraceToString of JavaUtils/SparkFileUtils/Utils instead.
+
+
+
+ \bPreconditions\.checkNotNull\b
+ Use requireNonNull of java.util.Objects instead.
+
+
+
+ \bInts\.checkedCast\b
+ Use JavaUtils.checkedCast instead.
+
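
Editor's note: the new style rules above steer contributors from Guava, commons-io and commons-lang3 helpers to the JDK or Spark utilities named in each message. A small illustrative sketch of a few of the pure-JDK replacements (`readAllBytes`, `transferTo`, `Objects.requireNonNull` all exist since Java 9):

```scala
import java.io.{ByteArrayInputStream, ByteArrayOutputStream}
import java.util.Objects

// ByteStreams.toByteArray(in)        -> in.readAllBytes()
// ByteStreams.copy(in, out)          -> in.transferTo(out)
// Preconditions.checkNotNull(x, msg) -> Objects.requireNonNull(x, msg)
val in = new ByteArrayInputStream("spark".getBytes("UTF-8"))
val out = new ByteArrayOutputStream()
in.transferTo(out)
val copied = Objects.requireNonNull(out.toByteArray, "copy must not be null")
assert(new String(copied, "UTF-8") == "spark")
```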
diff --git a/sql/api/pom.xml b/sql/api/pom.xml
index 86a8b0adaff95..184d39c4b8ea1 100644
--- a/sql/api/pom.xml
+++ b/sql/api/pom.xml
@@ -64,6 +64,10 @@
${project.version}compile
+
+ org.apache.commons
+ commons-lang3
+ org.json4sjson4s-jackson_${scala.binary.version}
diff --git a/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseLexer.g4 b/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseLexer.g4
index c698f2696eb41..e402067926f2a 100644
--- a/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseLexer.g4
+++ b/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseLexer.g4
@@ -507,6 +507,7 @@ WHILE: 'WHILE';
WINDOW: 'WINDOW';
WITH: 'WITH';
WITHIN: 'WITHIN';
+WITHOUT: 'WITHOUT';
YEAR: 'YEAR';
YEARS: 'YEARS';
ZONE: 'ZONE';
@@ -547,13 +548,13 @@ HENT_END: '*/';
QUESTION: '?';
STRING_LITERAL
- : '\'' ( ~('\''|'\\') | ('\\' .) )* '\''
+ : '\'' ( ~('\''|'\\') | ('\\' .) | ('\'' '\'') )* '\''
| 'R\'' (~'\'')* '\''
| 'R"'(~'"')* '"'
;
DOUBLEQUOTED_STRING
- :'"' ( ~('"'|'\\') | ('\\' .) )* '"'
+ :'"' ( ~('"'|'\\') | '""' | ('\\' .) )* '"'
;
// NOTE: If you move a numeric literal, you should modify `ParserUtils.toExprAlias()`
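
Editor's note: the lexer now accepts a doubled quote (`''` inside `'...'`, `""` inside `"..."`) as part of a single string token. A minimal sketch of the kind of statement this affects; whether the doubled quote unescapes to one quote or concatenates depends on how the `ignoreQuoteQuote` flag of `unescapeSQLString` (further below) is wired up, so no result is asserted here.

```scala
import org.apache.spark.sql.SparkSession

// Illustrative only: exercises the doubled-quote sequence newly accepted by STRING_LITERAL.
val spark = SparkSession.builder().master("local[1]").appName("quote-quote").getOrCreate()
spark.sql("SELECT 'It''s a test' AS s").show(truncate = false)
spark.stop()
```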
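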
diff --git a/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseParser.g4 b/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseParser.g4
index 08f222b2f4124..e63a229a32078 100644
--- a/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseParser.g4
+++ b/sql/api/src/main/antlr4/org/apache/spark/sql/catalyst/parser/SqlBaseParser.g4
@@ -298,7 +298,9 @@ statement
RETURN (query | expression) #createUserDefinedFunction
| DROP TEMPORARY? FUNCTION (IF EXISTS)? identifierReference #dropFunction
| DECLARE (OR REPLACE)? variable?
- identifierReference dataType? variableDefaultExpression? #createVariable
+ identifierReferences+=identifierReference
+ (COMMA identifierReferences+=identifierReference)*
+ dataType? variableDefaultExpression? #createVariable
| DROP TEMPORARY variable (IF EXISTS)? identifierReference #dropVariable
| EXPLAIN (LOGICAL | FORMATTED | EXTENDED | CODEGEN | COST)?
(statement|setResetStatement) #explain
@@ -374,8 +376,8 @@ createPipelineDatasetHeader
;
streamRelationPrimary
- : STREAM multipartIdentifier tableAlias optionsClause? #streamTableName
- | STREAM LEFT_PAREN multipartIdentifier RIGHT_PAREN tableAlias optionsClause? #streamTableName
+ : STREAM multipartIdentifier optionsClause? tableAlias #streamTableName
+ | STREAM LEFT_PAREN multipartIdentifier RIGHT_PAREN optionsClause? tableAlias #streamTableName
;
setResetStatement
@@ -1208,6 +1210,7 @@ primaryExpression
| constant #constantDefault
| ASTERISK exceptClause? #star
| qualifiedName DOT ASTERISK exceptClause? #star
+ | col=primaryExpression COLON path=semiStructuredExtractionPath #semiStructuredExtract
| LEFT_PAREN namedExpression (COMMA namedExpression)+ RIGHT_PAREN #rowConstructor
| LEFT_PAREN query RIGHT_PAREN #subqueryExpression
| functionName LEFT_PAREN (setQuantifier? argument+=functionArgument
@@ -1230,6 +1233,32 @@ primaryExpression
FROM position=valueExpression (FOR length=valueExpression)? RIGHT_PAREN #overlay
;
+semiStructuredExtractionPath
+ : jsonPathFirstPart (jsonPathParts)*
+ ;
+
+jsonPathIdentifier
+ : identifier
+ | BACKQUOTED_IDENTIFIER
+ ;
+
+jsonPathBracketedIdentifier
+ : LEFT_BRACKET stringLit RIGHT_BRACKET
+ ;
+
+jsonPathFirstPart
+ : jsonPathIdentifier
+ | jsonPathBracketedIdentifier
+ | LEFT_BRACKET INTEGER_VALUE RIGHT_BRACKET
+ ;
+
+jsonPathParts
+ : DOT jsonPathIdentifier
+ | jsonPathBracketedIdentifier
+ | LEFT_BRACKET INTEGER_VALUE RIGHT_BRACKET
+ | LEFT_BRACKET identifier RIGHT_BRACKET
+ ;
+
literalType
: DATE
| TIME
@@ -1313,7 +1342,20 @@ collateClause
: COLLATE collationName=multipartIdentifier
;
-type
+nonTrivialPrimitiveType
+ : STRING collateClause?
+ | (CHARACTER | CHAR) (LEFT_PAREN length=INTEGER_VALUE RIGHT_PAREN)?
+ | VARCHAR (LEFT_PAREN length=INTEGER_VALUE RIGHT_PAREN)?
+ | (DECIMAL | DEC | NUMERIC)
+ (LEFT_PAREN precision=INTEGER_VALUE (COMMA scale=INTEGER_VALUE)? RIGHT_PAREN)?
+ | INTERVAL
+ (fromYearMonth=(YEAR | MONTH) (TO to=MONTH)? |
+ fromDayTime=(DAY | HOUR | MINUTE | SECOND) (TO to=(HOUR | MINUTE | SECOND))?)?
+ | TIMESTAMP (WITHOUT TIME ZONE)?
+ | TIME (LEFT_PAREN precision=INTEGER_VALUE RIGHT_PAREN)? (WITHOUT TIME ZONE)?
+ ;
+
+trivialPrimitiveType
: BOOLEAN
| TINYINT | BYTE
| SMALLINT | SHORT
@@ -1322,29 +1364,23 @@ type
| FLOAT | REAL
| DOUBLE
| DATE
- | TIME
- | TIMESTAMP | TIMESTAMP_NTZ | TIMESTAMP_LTZ
- | STRING collateClause?
- | CHARACTER | CHAR
- | VARCHAR
+ | TIMESTAMP_LTZ | TIMESTAMP_NTZ
| BINARY
- | DECIMAL | DEC | NUMERIC
| VOID
- | INTERVAL
| VARIANT
- | ARRAY | STRUCT | MAP
- | unsupportedType=identifier
+ ;
+
+primitiveType
+ : nonTrivialPrimitiveType
+ | trivialPrimitiveType
+ | unsupportedType=identifier (LEFT_PAREN INTEGER_VALUE(COMMA INTEGER_VALUE)* RIGHT_PAREN)?
;
dataType
- : complex=ARRAY LT dataType GT #complexDataType
- | complex=MAP LT dataType COMMA dataType GT #complexDataType
- | complex=STRUCT (LT complexColTypeList? GT | NEQ) #complexDataType
- | INTERVAL from=(YEAR | MONTH) (TO to=MONTH)? #yearMonthIntervalDataType
- | INTERVAL from=(DAY | HOUR | MINUTE | SECOND)
- (TO to=(HOUR | MINUTE | SECOND))? #dayTimeIntervalDataType
- | type (LEFT_PAREN INTEGER_VALUE
- (COMMA INTEGER_VALUE)* RIGHT_PAREN)? #primitiveDataType
+ : complex=ARRAY (LT dataType GT)? #complexDataType
+ | complex=MAP (LT dataType COMMA dataType GT)? #complexDataType
+ | complex=STRUCT ((LT complexColTypeList? GT) | NEQ)? #complexDataType
+ | primitiveType #primitiveDataType
;
qualifiedColTypeWithPositionList
@@ -2013,6 +2049,7 @@ ansiNonReserved
| WEEKS
| WHILE
| WINDOW
+ | WITHOUT
| YEAR
| YEARS
| ZONE
@@ -2423,6 +2460,7 @@ nonReserved
| WINDOW
| WITH
| WITHIN
+ | WITHOUT
| YEAR
| YEARS
| ZONE
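
Editor's note: a sketch of statements the revised parser rules are meant to accept — a comma-separated `DECLARE` list and the new `col:path` semi-structured extraction. These SQL strings are assumptions derived from the grammar above, not documented behavior; runtime acceptance is not asserted.

```scala
import org.apache.spark.sql.SparkSession

val spark = SparkSession.builder().master("local[1]").appName("grammar-sketch").getOrCreate()

// DECLARE now takes multiple identifierReferences in one statement.
spark.sql("DECLARE v1, v2 INT DEFAULT 0")

// semiStructuredExtract: VARIANT column followed by a colon and a JSON-style path.
spark.sql("""SELECT parse_json('{"a": {"b": 1}}') AS v""").createOrReplaceTempView("t")
spark.sql("SELECT v:a.b FROM t").show()

spark.stop()
```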
diff --git a/sql/api/src/main/java/org/apache/spark/sql/connector/catalog/IdentifierImpl.java b/sql/api/src/main/java/org/apache/spark/sql/connector/catalog/IdentifierImpl.java
index ba883b8042c4d..d209a540823c2 100644
--- a/sql/api/src/main/java/org/apache/spark/sql/connector/catalog/IdentifierImpl.java
+++ b/sql/api/src/main/java/org/apache/spark/sql/connector/catalog/IdentifierImpl.java
@@ -17,8 +17,6 @@
package org.apache.spark.sql.connector.catalog;
-import org.apache.arrow.util.Preconditions;
-
import java.util.Arrays;
import java.util.Objects;
import java.util.StringJoiner;
@@ -36,10 +34,8 @@ class IdentifierImpl implements Identifier {
private String name;
IdentifierImpl(String[] namespace, String name) {
- Preconditions.checkNotNull(namespace, "Identifier namespace cannot be null");
- Preconditions.checkNotNull(name, "Identifier name cannot be null");
- this.namespace = namespace;
- this.name = name;
+ this.namespace = Objects.requireNonNull(namespace, "Identifier namespace cannot be null");
+ this.name = Objects.requireNonNull(name, "Identifier name cannot be null");
}
@Override
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/Artifact.scala b/sql/api/src/main/scala/org/apache/spark/sql/Artifact.scala
index 7e020df06fe47..40c7e532c27db 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/Artifact.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/Artifact.scala
@@ -21,12 +21,10 @@ import java.io.{ByteArrayInputStream, InputStream, PrintStream}
import java.net.URI
import java.nio.file.{Files, Path, Paths}
-import org.apache.commons.lang3.StringUtils
-
import org.apache.spark.sql.Artifact.LocalData
import org.apache.spark.sql.util.ArtifactUtils
+import org.apache.spark.util.{MavenUtils, SparkStringUtils}
import org.apache.spark.util.ArrayImplicits._
-import org.apache.spark.util.MavenUtils
private[sql] class Artifact private (val path: Path, val storage: LocalData) {
require(!path.isAbsolute, s"Bad path: $path")
@@ -104,7 +102,7 @@ private[sql] object Artifact {
val (transitive, exclusions, repos) = MavenUtils.parseQueryParams(uri)
val exclusionsList: Seq[String] =
- if (!StringUtils.isBlank(exclusions)) {
+ if (!SparkStringUtils.isBlank(exclusions)) {
exclusions.split(",").toImmutableArraySeq
} else {
Nil
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/Column.scala b/sql/api/src/main/scala/org/apache/spark/sql/Column.scala
index 88d597fdfbb73..316b629df4c14 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/Column.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/Column.scala
@@ -20,7 +20,7 @@ package org.apache.spark.sql
import scala.jdk.CollectionConverters._
import org.apache.spark.annotation.Stable
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{LEFT_EXPR, RIGHT_EXPR}
import org.apache.spark.sql.catalyst.parser.DataTypeParser
import org.apache.spark.sql.catalyst.trees.CurrentOrigin.withOrigin
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/Encoders.scala b/sql/api/src/main/scala/org/apache/spark/sql/Encoders.scala
index 94a627fd17a64..cb1402e1b0f4a 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/Encoders.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/Encoders.scala
@@ -368,4 +368,11 @@ object Encoders {
*/
def scalaBoolean: Encoder[Boolean] = PrimitiveBooleanEncoder
+ /**
+ * An encoder for UserDefinedType.
+ * @since 4.1.0
+ */
+ def udt[T >: Null](tpe: UserDefinedType[T]): Encoder[T] = {
+ UDTEncoder(tpe)
+ }
}
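
Editor's note: a minimal sketch of the new `Encoders.udt` entry point. `Celsius`/`CelsiusUDT` are toy types invented for illustration, and the snippet assumes it is compiled where `UserDefinedType` is accessible (e.g. inside Spark's own modules).

```scala
package org.apache.spark.example

import org.apache.spark.sql.{Encoder, Encoders, SparkSession}
import org.apache.spark.sql.types.{DataType, DoubleType, UserDefinedType}

// Toy user type and UDT, defined only to illustrate Encoders.udt.
case class Celsius(degrees: Double)

class CelsiusUDT extends UserDefinedType[Celsius] {
  override def sqlType: DataType = DoubleType
  override def serialize(c: Celsius): Any = c.degrees
  override def deserialize(datum: Any): Celsius = Celsius(datum.asInstanceOf[Double])
  override def userClass: Class[Celsius] = classOf[Celsius]
}

object UdtEncoderExample {
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder().master("local[1]").appName("udt-encoder").getOrCreate()
    // Encoders.udt wraps the UDT in a UDTEncoder, so a Dataset[Celsius] can be built directly.
    implicit val enc: Encoder[Celsius] = Encoders.udt(new CelsiusUDT)
    val ds = spark.createDataset(Seq(Celsius(21.5), Celsius(19.0)))
    ds.show()
    spark.stop()
  }
}
```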
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/AgnosticEncoder.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/AgnosticEncoder.scala
index 1dd939131ab96..0c5295176608f 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/AgnosticEncoder.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/AgnosticEncoder.scala
@@ -182,6 +182,12 @@ object AgnosticEncoders {
override def clsTag: ClassTag[E] = ClassTag(udt.userClass)
}
+ object UDTEncoder {
+ def apply[E >: Null](udt: UserDefinedType[E]): UDTEncoder[E] = {
+ new UDTEncoder(udt, udt.getClass.asInstanceOf[Class[_ <: UserDefinedType[_]]])
+ }
+ }
+
// Enums are special leafs because we need to capture the class.
protected abstract class EnumEncoder[E] extends AgnosticEncoder[E] {
override def isPrimitive: Boolean = false
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/RowEncoder.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/RowEncoder.scala
index d5692bb85c4e9..620278c66d21d 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/RowEncoder.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/encoders/RowEncoder.scala
@@ -22,7 +22,7 @@ import scala.reflect.classTag
import org.apache.spark.sql.{AnalysisException, Row}
import org.apache.spark.sql.catalyst.encoders.AgnosticEncoders.{BinaryEncoder, BoxedBooleanEncoder, BoxedByteEncoder, BoxedDoubleEncoder, BoxedFloatEncoder, BoxedIntEncoder, BoxedLongEncoder, BoxedShortEncoder, CalendarIntervalEncoder, CharEncoder, DateEncoder, DayTimeIntervalEncoder, EncoderField, InstantEncoder, IterableEncoder, JavaDecimalEncoder, LocalDateEncoder, LocalDateTimeEncoder, LocalTimeEncoder, MapEncoder, NullEncoder, RowEncoder => AgnosticRowEncoder, StringEncoder, TimestampEncoder, UDTEncoder, VarcharEncoder, VariantEncoder, YearMonthIntervalEncoder}
-import org.apache.spark.sql.errors.{DataTypeErrorsBase, ExecutionErrors}
+import org.apache.spark.sql.errors.DataTypeErrorsBase
import org.apache.spark.sql.internal.SqlApiConf
import org.apache.spark.sql.types._
import org.apache.spark.util.ArrayImplicits._
@@ -99,16 +99,7 @@ object RowEncoder extends DataTypeErrorsBase {
case p: PythonUserDefinedType =>
// TODO check if this works.
encoderForDataType(p.sqlType, lenient)
- case udt: UserDefinedType[_] =>
- val annotation = udt.userClass.getAnnotation(classOf[SQLUserDefinedType])
- val udtClass: Class[_] = if (annotation != null) {
- annotation.udt()
- } else {
- UDTRegistration.getUDTFor(udt.userClass.getName).getOrElse {
- throw ExecutionErrors.userDefinedTypeNotAnnotatedAndRegisteredError(udt)
- }
- }
- UDTEncoder(udt, udtClass.asInstanceOf[Class[_ <: UserDefinedType[_]]])
+ case udt: UserDefinedType[_] => UDTEncoder(udt, udt.getClass)
case ArrayType(elementType, containsNull) =>
IterableEncoder(
classTag[mutable.ArraySeq[_]],
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/DataTypeAstBuilder.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/DataTypeAstBuilder.scala
index bf9a250d6499e..beb7061a841a8 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/DataTypeAstBuilder.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/DataTypeAstBuilder.scala
@@ -69,54 +69,85 @@ class DataTypeAstBuilder extends SqlBaseParserBaseVisitor[AnyRef] {
* Resolve/create a primitive type.
*/
override def visitPrimitiveDataType(ctx: PrimitiveDataTypeContext): DataType = withOrigin(ctx) {
- val typeCtx = ctx.`type`
- (typeCtx.start.getType, ctx.INTEGER_VALUE().asScala.toList) match {
- case (BOOLEAN, Nil) => BooleanType
- case (TINYINT | BYTE, Nil) => ByteType
- case (SMALLINT | SHORT, Nil) => ShortType
- case (INT | INTEGER, Nil) => IntegerType
- case (BIGINT | LONG, Nil) => LongType
- case (FLOAT | REAL, Nil) => FloatType
- case (DOUBLE, Nil) => DoubleType
- case (DATE, Nil) => DateType
- case (TIME, Nil) => TimeType(TimeType.MICROS_PRECISION)
- case (TIME, precision :: Nil) => TimeType(precision.getText.toInt)
- case (TIMESTAMP, Nil) => SqlApiConf.get.timestampType
- case (TIMESTAMP_NTZ, Nil) => TimestampNTZType
- case (TIMESTAMP_LTZ, Nil) => TimestampType
- case (STRING, Nil) =>
- typeCtx.children.asScala.toSeq match {
- case Seq(_) => StringType
- case Seq(_, ctx: CollateClauseContext) =>
- val collationNameParts = visitCollateClause(ctx).toArray
- val collationId = CollationFactory.collationNameToId(
- CollationFactory.resolveFullyQualifiedName(collationNameParts))
- StringType(collationId)
- }
- case (CHARACTER | CHAR, length :: Nil) => CharType(length.getText.toInt)
- case (VARCHAR, length :: Nil) => VarcharType(length.getText.toInt)
- case (BINARY, Nil) => BinaryType
- case (DECIMAL | DEC | NUMERIC, Nil) => DecimalType.USER_DEFAULT
- case (DECIMAL | DEC | NUMERIC, precision :: Nil) =>
- DecimalType(precision.getText.toInt, 0)
- case (DECIMAL | DEC | NUMERIC, precision :: scale :: Nil) =>
- DecimalType(precision.getText.toInt, scale.getText.toInt)
- case (VOID, Nil) => NullType
- case (INTERVAL, Nil) => CalendarIntervalType
- case (VARIANT, Nil) => VariantType
- case (CHARACTER | CHAR | VARCHAR, Nil) =>
- throw QueryParsingErrors.charTypeMissingLengthError(ctx.`type`.getText, ctx)
- case (ARRAY | STRUCT | MAP, Nil) =>
- throw QueryParsingErrors.nestedTypeMissingElementTypeError(ctx.`type`.getText, ctx)
- case (_, params) =>
- val badType = ctx.`type`.getText
- val dtStr = if (params.nonEmpty) s"$badType(${params.mkString(",")})" else badType
- throw QueryParsingErrors.dataTypeUnsupportedError(dtStr, ctx)
+ val typeCtx = ctx.primitiveType
+ if (typeCtx.nonTrivialPrimitiveType != null) {
+ // This is a primitive type with parameters, e.g. VARCHAR(10), DECIMAL(10, 2), etc.
+ val currentCtx = typeCtx.nonTrivialPrimitiveType
+ currentCtx.start.getType match {
+ case STRING =>
+ currentCtx.children.asScala.toSeq match {
+ case Seq(_) => StringType
+ case Seq(_, ctx: CollateClauseContext) =>
+ val collationNameParts = visitCollateClause(ctx).toArray
+ val collationId = CollationFactory.collationNameToId(
+ CollationFactory.resolveFullyQualifiedName(collationNameParts))
+ StringType(collationId)
+ }
+ case CHARACTER | CHAR =>
+ if (currentCtx.length == null) {
+ throw QueryParsingErrors.charVarcharTypeMissingLengthError(typeCtx.getText, ctx)
+ } else CharType(currentCtx.length.getText.toInt)
+ case VARCHAR =>
+ if (currentCtx.length == null) {
+ throw QueryParsingErrors.charVarcharTypeMissingLengthError(typeCtx.getText, ctx)
+ } else VarcharType(currentCtx.length.getText.toInt)
+ case DECIMAL | DEC | NUMERIC =>
+ if (currentCtx.precision == null) {
+ DecimalType.USER_DEFAULT
+ } else if (currentCtx.scale == null) {
+ DecimalType(currentCtx.precision.getText.toInt, 0)
+ } else {
+ DecimalType(currentCtx.precision.getText.toInt, currentCtx.scale.getText.toInt)
+ }
+ case INTERVAL =>
+ if (currentCtx.fromDayTime != null) {
+ visitDayTimeIntervalDataType(currentCtx)
+ } else if (currentCtx.fromYearMonth != null) {
+ visitYearMonthIntervalDataType(currentCtx)
+ } else {
+ CalendarIntervalType
+ }
+ case TIMESTAMP =>
+ if (currentCtx.WITHOUT() == null) {
+ SqlApiConf.get.timestampType
+ } else TimestampNTZType
+ case TIME =>
+ val precision = if (currentCtx.precision == null) {
+ TimeType.DEFAULT_PRECISION
+ } else {
+ currentCtx.precision.getText.toInt
+ }
+ TimeType(precision)
+ }
+ } else if (typeCtx.trivialPrimitiveType != null) {
+ // This is a primitive type without parameters, e.g. BOOLEAN, TINYINT, etc.
+ typeCtx.trivialPrimitiveType.start.getType match {
+ case BOOLEAN => BooleanType
+ case TINYINT | BYTE => ByteType
+ case SMALLINT | SHORT => ShortType
+ case INT | INTEGER => IntegerType
+ case BIGINT | LONG => LongType
+ case FLOAT | REAL => FloatType
+ case DOUBLE => DoubleType
+ case DATE => DateType
+ case TIMESTAMP_LTZ => TimestampType
+ case TIMESTAMP_NTZ => TimestampNTZType
+ case BINARY => BinaryType
+ case VOID => NullType
+ case VARIANT => VariantType
+ }
+ } else {
+ val badType = typeCtx.unsupportedType.getText
+ val params = typeCtx.INTEGER_VALUE().asScala.toList
+ val dtStr =
+ if (params.nonEmpty) s"$badType(${params.mkString(",")})"
+ else badType
+ throw QueryParsingErrors.dataTypeUnsupportedError(dtStr, ctx)
}
}
- override def visitYearMonthIntervalDataType(ctx: YearMonthIntervalDataTypeContext): DataType = {
- val startStr = ctx.from.getText.toLowerCase(Locale.ROOT)
+ private def visitYearMonthIntervalDataType(ctx: NonTrivialPrimitiveTypeContext): DataType = {
+ val startStr = ctx.fromYearMonth.getText.toLowerCase(Locale.ROOT)
val start = YearMonthIntervalType.stringToField(startStr)
if (ctx.to != null) {
val endStr = ctx.to.getText.toLowerCase(Locale.ROOT)
@@ -130,8 +161,8 @@ class DataTypeAstBuilder extends SqlBaseParserBaseVisitor[AnyRef] {
}
}
- override def visitDayTimeIntervalDataType(ctx: DayTimeIntervalDataTypeContext): DataType = {
- val startStr = ctx.from.getText.toLowerCase(Locale.ROOT)
+ private def visitDayTimeIntervalDataType(ctx: NonTrivialPrimitiveTypeContext): DataType = {
+ val startStr = ctx.fromDayTime.getText.toLowerCase(Locale.ROOT)
val start = DayTimeIntervalType.stringToField(startStr)
if (ctx.to != null) {
val endStr = ctx.to.getText.toLowerCase(Locale.ROOT)
@@ -149,6 +180,9 @@ class DataTypeAstBuilder extends SqlBaseParserBaseVisitor[AnyRef] {
* Create a complex DataType. Arrays, Maps and Structures are supported.
*/
override def visitComplexDataType(ctx: ComplexDataTypeContext): DataType = withOrigin(ctx) {
+ if (ctx.LT() == null && ctx.NEQ() == null) {
+ throw QueryParsingErrors.nestedTypeMissingElementTypeError(ctx.getText, ctx)
+ }
ctx.complex.getType match {
case SqlBaseParser.ARRAY =>
ArrayType(typedVisit(ctx.dataType(0)))
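
Editor's note: a short sketch of type strings the reworked `visitPrimitiveDataType` is intended to handle, written against the public `DataType.fromDDL` parser entry point. The expected result types in the comments are assumptions read off the code above.

```scala
import org.apache.spark.sql.types.DataType

DataType.fromDDL("timestamp")                    // session-default timestamp type
DataType.fromDDL("timestamp without time zone")  // TimestampNTZType via the new WITHOUT keyword
DataType.fromDDL("time(3)")                      // TimeType with explicit precision
DataType.fromDDL("decimal(10, 2)")               // DecimalType(10, 2)
DataType.fromDDL("string collate UTF8_LCASE")    // collated StringType
```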
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/parsers.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/parsers.scala
index 28fccd2092b34..f149fd5f165f7 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/parsers.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/parser/parsers.scala
@@ -16,15 +16,18 @@
*/
package org.apache.spark.sql.catalyst.parser
+import java.util.concurrent.atomic.AtomicReference
+
import scala.jdk.CollectionConverters._
import org.antlr.v4.runtime._
-import org.antlr.v4.runtime.atn.PredictionMode
+import org.antlr.v4.runtime.atn.{ATN, ParserATNSimulator, PredictionContextCache, PredictionMode}
+import org.antlr.v4.runtime.dfa.DFA
import org.antlr.v4.runtime.misc.{Interval, ParseCancellationException}
import org.antlr.v4.runtime.tree.TerminalNodeImpl
import org.apache.spark.{QueryContext, SparkException, SparkThrowable, SparkThrowableHelper}
-import org.apache.spark.internal.Logging
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin, SQLQueryContext, WithOrigin}
import org.apache.spark.sql.catalyst.util.SparkParserUtils
@@ -62,6 +65,7 @@ abstract class AbstractParser extends DataTypeParserInterface with Logging {
val tokenStream = new CommonTokenStream(lexer)
val parser = new SqlBaseParser(tokenStream)
+ if (conf.manageParserCaches) AbstractParser.installCaches(parser)
parser.addParseListener(PostProcessor)
parser.addParseListener(UnclosedCommentProcessor(command, tokenStream))
parser.removeErrorListeners()
@@ -102,6 +106,18 @@ abstract class AbstractParser extends DataTypeParserInterface with Logging {
errorClass = e.getCondition,
messageParameters = e.getMessageParameters.asScala.toMap,
queryContext = e.getQueryContext)
+ } finally {
+ // Antlr4 uses caches to make parsing faster but its caches are unbounded and never purged,
+ // which can cause OOMs when parsing a huge number of SQL queries. Clearing these caches too
+ // often will slow down parsing and cause performance regressions, but will prevent OOMs
+ // caused by the parser cache. We use a heuristic and clear the cache if the number of states
+ // in the DFA cache has exceeded the threshold
+ // configured by `spark.sql.parser.parserDfaCacheFlushThreshold`. These states generally
+ // represent the bulk of the memory consumed by the parser, and the size of a single state
+ // is approximately `BYTES_PER_DFA_STATE` bytes.
+ //
+ // Negative values mean we should never clear the cache
+ AbstractParser.maybeClearParserCaches(parser, conf)
}
}
@@ -439,3 +455,109 @@ case class UnclosedCommentProcessor(command: String, tokenStream: CommonTokenStr
object DataTypeParser extends AbstractParser {
override protected def astBuilder: DataTypeAstBuilder = new DataTypeAstBuilder
}
+
+object AbstractParser extends Logging {
+ // Approximation based on experiments. Used to estimate the size of the DFA cache for the
+ // `parserDfaCacheFlushRatio` threshold.
+ final val BYTES_PER_DFA_STATE = 9700
+
+ private val DRIVER_MEMORY = Runtime.getRuntime.maxMemory()
+
+ private case class AntlrCaches(atn: ATN) {
+ private[parser] val predictionContextCache: PredictionContextCache =
+ new PredictionContextCache
+ private[parser] val decisionToDFACache: Array[DFA] = AntlrCaches.makeDecisionToDFACache(atn)
+
+ def installManagedParserCaches(parser: SqlBaseParser): Unit = {
+ parser.setInterpreter(
+ new ParserATNSimulator(parser, atn, decisionToDFACache, predictionContextCache))
+ }
+ }
+
+ private object AntlrCaches {
+ private def makeDecisionToDFACache(atn: ATN): Array[DFA] = {
+ val decisionToDFA = new Array[DFA](atn.getNumberOfDecisions)
+ for (i <- 0 until atn.getNumberOfDecisions) {
+ decisionToDFA(i) = new DFA(atn.getDecisionState(i), i)
+ }
+ decisionToDFA
+ }
+ }
+
+ private val parserCaches = new AtomicReference[AntlrCaches](AntlrCaches(SqlBaseParser._ATN))
+
+ private var numDFACacheStates: Long = 0
+ def getDFACacheNumStates: Long = numDFACacheStates
+
+ /**
+ * Returns the number of DFA states in the DFA cache.
+ *
+ * DFA states empirically consume about `BYTES_PER_DFA_STATE` bytes of memory each.
+ */
+ private def computeDFACacheNumStates: Long = {
+ parserCaches.get().decisionToDFACache.map(_.states.size).sum
+ }
+
+ /**
+ * Install the managed parser caches into the given parser. Configuring the parser to use the
+ * managed `AntlrCaches` enables us to manage the size of the cache and clear it when required
+ * as the parser caches are unbounded by default.
+ *
+ * This method should be called before parsing any input.
+ */
+ private[parser] def installCaches(parser: SqlBaseParser): Unit = {
+ parserCaches.get().installManagedParserCaches(parser)
+ }
+
+ /**
+ * Drop the existing parser caches and create a new one.
+ *
+ * ANTLR retains caches in its parser that are never released. This speeds up parsing of future
+ * input, but it can consume a lot of memory depending on the input seen so far.
+ *
+ * This method provides a mechanism to free the retained caches, which can be useful after
+ * parsing very large SQL inputs, especially if those large inputs are unlikely to be similar to
+ * future inputs seen by the driver.
+ */
+ private[parser] def clearParserCaches(parser: SqlBaseParser): Unit = {
+ parserCaches.set(AntlrCaches(SqlBaseParser._ATN))
+ logInfo(log"ANTLR parser caches cleared")
+ numDFACacheStates = 0
+ installCaches(parser)
+ }
+
+ /**
+ * Check cache size and config values to determine if we should clear the parser caches. Also
+ * logs the current cache size and the delta since the last check. This method should be called
+ * after parsing each input.
+ */
+ private[parser] def maybeClearParserCaches(parser: SqlBaseParser, conf: SqlApiConf): Unit = {
+ if (!conf.manageParserCaches) {
+ return
+ }
+
+ val numDFACacheStatesCurrent: Long = computeDFACacheNumStates
+ val numDFACacheStatesDelta = numDFACacheStatesCurrent - numDFACacheStates
+ numDFACacheStates = numDFACacheStatesCurrent
+ logInfo(
+ log"EXPERIMENTAL: Query cached " +
+ log"${MDC(LogKeys.ANTLR_DFA_CACHE_DELTA, numDFACacheStatesDelta)} " +
+ log"DFA states in the parser. Total cached DFA states: " +
+ log"${MDC(LogKeys.ANTLR_DFA_CACHE_SIZE, numDFACacheStatesCurrent)}." +
+ log"Driver memory: ${MDC(LogKeys.DRIVER_JVM_MEMORY, DRIVER_MEMORY)}.")
+
+ val staticThresholdExceeded = 0 <= conf.parserDfaCacheFlushThreshold &&
+ conf.parserDfaCacheFlushThreshold <= numDFACacheStatesCurrent
+
+ val estCacheBytes: Long = numDFACacheStatesCurrent * BYTES_PER_DFA_STATE
+ if (estCacheBytes < 0) {
+ logWarning(log"Estimated cache size is negative, likely due to an integer overflow.")
+ }
+ val dynamicThresholdExceeded = 0 <= conf.parserDfaCacheFlushRatio &&
+ conf.parserDfaCacheFlushRatio * DRIVER_MEMORY / 100 <= estCacheBytes
+
+ if (staticThresholdExceeded || dynamicThresholdExceeded) {
+ AbstractParser.clearParserCaches(parser)
+ }
+ }
+}
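
Editor's note: a standalone sketch of the flush heuristic in `maybeClearParserCaches`, using the same constant and the same percentage-based ratio check. The threshold and ratio values below are illustrative assumptions, not recommended settings.

```scala
val bytesPerDfaState = 9700L                      // mirrors BYTES_PER_DFA_STATE
val driverMemory = Runtime.getRuntime.maxMemory() // mirrors DRIVER_MEMORY

def shouldFlush(cachedStates: Long, flushThreshold: Long, flushRatioPercent: Double): Boolean = {
  // Static threshold: flush once the absolute number of cached DFA states is exceeded.
  val staticExceeded = 0 <= flushThreshold && flushThreshold <= cachedStates
  // Dynamic threshold: flush once the estimated cache size reaches a fraction of driver memory.
  val estCacheBytes = cachedStates * bytesPerDfaState
  val dynamicExceeded = 0 <= flushRatioPercent &&
    flushRatioPercent * driverMemory / 100 <= estCacheBytes
  staticExceeded || dynamicExceeded
}

// E.g. 200,000 cached states ~ 200000 * 9700 B ~ 1.9 GB of estimated parser cache.
assert(shouldFlush(cachedStates = 200000L, flushThreshold = 100000L, flushRatioPercent = 10.0))
```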
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkDateTimeUtils.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkDateTimeUtils.scala
index 6a51799e1132d..9ce9d14ed3161 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkDateTimeUtils.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkDateTimeUtils.scala
@@ -19,7 +19,7 @@ package org.apache.spark.sql.catalyst.util
import java.lang.invoke.{MethodHandles, MethodType}
import java.sql.{Date, Timestamp}
import java.time.{Instant, LocalDate, LocalDateTime, LocalTime, ZonedDateTime, ZoneId, ZoneOffset}
-import java.time.temporal.ChronoField.MICRO_OF_DAY
+import java.time.temporal.ChronoField.NANO_OF_DAY
import java.util.TimeZone
import java.util.concurrent.TimeUnit.{MICROSECONDS, NANOSECONDS}
import java.util.regex.Pattern
@@ -83,6 +83,12 @@ trait SparkDateTimeUtils {
case ldt: LocalDateTime => localDateTimeToMicros(ldt)
}
+ /**
+ * Converts the time to microseconds since midnight. In Spark time values have nanoseconds
+ * precision, so this conversion is lossy.
+ */
+ def nanosToMicros(nanos: Long): Long = Math.floorDiv(nanos, NANOS_PER_MICROS)
+
/**
* Converts the timestamp to milliseconds since epoch. In Spark timestamp values have
* microseconds precision, so this conversion is lossy.
@@ -101,6 +107,11 @@ trait SparkDateTimeUtils {
Math.multiplyExact(millis, MICROS_PER_MILLIS)
}
+ /**
+ * Converts microseconds since midnight to nanoseconds.
+ */
+ def microsToNanos(micros: Long): Long = Math.multiplyExact(micros, NANOS_PER_MICROS)
+
// See issue SPARK-35679
// min second cause overflow in instant to micro
private val MIN_SECONDS = Math.floorDiv(Long.MinValue, MICROS_PER_SECOND)
@@ -134,42 +145,42 @@ trait SparkDateTimeUtils {
}
/**
- * Gets the number of microseconds since midnight using the given time zone.
+ * Gets the number of nanoseconds since midnight using the given time zone.
*/
- def instantToMicrosOfDay(instant: Instant, timezone: String): Long = {
- instantToMicrosOfDay(instant, getZoneId(timezone))
+ def instantToNanosOfDay(instant: Instant, timezone: String): Long = {
+ instantToNanosOfDay(instant, getZoneId(timezone))
}
/**
- * Gets the number of microseconds since midnight using the given time zone.
+ * Gets the number of nanoseconds since midnight using the given time zone.
*/
- def instantToMicrosOfDay(instant: Instant, zoneId: ZoneId): Long = {
+ def instantToNanosOfDay(instant: Instant, zoneId: ZoneId): Long = {
val localDateTime = LocalDateTime.ofInstant(instant, zoneId)
- localDateTime.toLocalTime.getLong(MICRO_OF_DAY)
+ localDateTime.toLocalTime.getLong(NANO_OF_DAY)
}
/**
- * Truncates a time value (in microseconds) to the specified fractional precision `p`.
+ * Truncates a time value (in nanoseconds) to the specified fractional precision `p`.
*
* For example, if `p = 3`, we keep millisecond resolution and discard any digits beyond the
- * thousand-microsecond place. So a value like `123456` microseconds (12:34:56.123456) becomes
+ * thousand-nanosecond place. So a value like `123456` microseconds (12:34:56.123456) becomes
* `123000` microseconds (12:34:56.123).
*
- * @param micros
- * The original time in microseconds.
+ * @param nanos
+ * The original time in nanoseconds.
* @param p
* The fractional second precision (range 0 to 6).
* @return
- * The truncated microsecond value, preserving only `p` fractional digits.
+ * The truncated nanosecond value, preserving only `p` fractional digits.
*/
- def truncateTimeMicrosToPrecision(micros: Long, p: Int): Long = {
+ def truncateTimeToPrecision(nanos: Long, p: Int): Long = {
assert(
- p >= TimeType.MIN_PRECISION && p <= TimeType.MICROS_PRECISION,
+ TimeType.MIN_PRECISION <= p && p <= TimeType.MAX_PRECISION,
s"Fractional second precision $p out" +
- s" of range [${TimeType.MIN_PRECISION}..${TimeType.MICROS_PRECISION}].")
- val scale = TimeType.MICROS_PRECISION - p
+ s" of range [${TimeType.MIN_PRECISION}..${TimeType.MAX_PRECISION}].")
+ val scale = TimeType.NANOS_PRECISION - p
val factor = math.pow(10, scale).toLong
- (micros / factor) * factor
+ (nanos / factor) * factor
}
/**
@@ -225,17 +236,15 @@ trait SparkDateTimeUtils {
}
/**
- * Converts the local time to the number of microseconds within the day, from 0 to (24 * 60 * 60
- * * 1000000) - 1.
+ * Converts the local time to the number of nanoseconds within the day, from 0 to (24 * 60 * 60
+ * * 1000 * 1000 * 1000) - 1.
*/
- def localTimeToMicros(localTime: LocalTime): Long = localTime.getLong(MICRO_OF_DAY)
+ def localTimeToNanos(localTime: LocalTime): Long = localTime.getLong(NANO_OF_DAY)
/**
- * Converts the number of microseconds within the day to the local time.
+ * Converts the number of nanoseconds within the day to the local time.
*/
- def microsToLocalTime(micros: Long): LocalTime = {
- LocalTime.ofNanoOfDay(Math.multiplyExact(micros, NANOS_PER_MICROS))
- }
+ def nanosToLocalTime(nanos: Long): LocalTime = LocalTime.ofNanoOfDay(nanos)
/**
* Converts a local date at the default JVM time zone to the number of days since 1970-01-01 in
@@ -708,15 +717,63 @@ trait SparkDateTimeUtils {
*/
def stringToTime(s: UTF8String): Option[Long] = {
try {
- val (segments, zoneIdOpt, justTime) = parseTimestampString(s)
+ // Check for the AM/PM suffix.
+ val trimmed = s.trimRight
+ val numChars = trimmed.numChars()
+ var (isAM, isPM, hasSuffix) = (false, false, false)
+ if (numChars > 2) {
+ val lc = trimmed.getChar(numChars - 1)
+ if (lc == 'M' || lc == 'm') {
+ val slc = trimmed.getChar(numChars - 2)
+ isAM = slc == 'A' || slc == 'a'
+ isPM = slc == 'P' || slc == 'p'
+ hasSuffix = isAM || isPM
+ }
+ }
+ val timeString = if (hasSuffix) {
+ trimmed.substring(0, numChars - 2)
+ } else {
+ trimmed
+ }
+
+ val (segments, zoneIdOpt, justTime) = parseTimestampString(timeString)
+
// If the input string can't be parsed as a time, or it contains not only
// the time part or has time zone information, return None.
if (segments.isEmpty || !justTime || zoneIdOpt.isDefined) {
return None
}
- val nanoseconds = MICROSECONDS.toNanos(segments(6))
- val localTime = LocalTime.of(segments(3), segments(4), segments(5), nanoseconds.toInt)
- Some(localTimeToMicros(localTime))
+
+ // Unpack the segments.
+ var (hr, min, sec, ms) = (segments(3), segments(4), segments(5), segments(6))
+
+ // Handle AM/PM conversion in separate cases.
+ if (!hasSuffix) {
+ // For 24-hour format, validate hour range: 0-23.
+ if (hr < 0 || hr > 23) {
+ return None
+ }
+ } else {
+ // For 12-hour format, validate hour range: 1-12.
+ if (hr < 1 || hr > 12) {
+ return None
+ }
+ // For 12-hour format, convert to 24-hour format.
+ if (isAM) {
+ // AM: 12:xx:xx becomes 00:xx:xx, 1-11:xx:xx stays the same.
+ if (hr == 12) {
+ hr = 0
+ }
+ } else {
+ // PM: 12:xx:xx stays 12:xx:xx, 1-11:xx:xx becomes 13-23:xx:xx.
+ if (hr != 12) {
+ hr += 12
+ }
+ }
+ }
+
+ val localTime = LocalTime.of(hr, min, sec, MICROSECONDS.toNanos(ms).toInt)
+ Some(localTimeToNanos(localTime))
} catch {
case NonFatal(_) => None
}
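
The 12-hour branch above applies the usual AM/PM mapping; a self-contained sketch of just that rule (the helper name is illustrative):

def to24Hour(hour12: Int, isPM: Boolean): Int = {
  require(1 <= hour12 && hour12 <= 12, s"hour $hour12 out of range [1..12]")
  if (isPM) { if (hour12 == 12) 12 else hour12 + 12 } // 12 PM stays 12, 1-11 PM add 12
  else { if (hour12 == 12) 0 else hour12 }            // 12 AM becomes 0, 1-11 AM unchanged
}

assert(to24Hour(12, isPM = false) == 0)  // 12:30 AM -> 00:30
assert(to24Hour(12, isPM = true) == 12)  // 12:30 PM -> 12:30
assert(to24Hour(7, isPM = true) == 19)   //  7:30 PM -> 19:30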
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkParserUtils.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkParserUtils.scala
index 9c9e623e03395..52788262ce169 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkParserUtils.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/SparkParserUtils.scala
@@ -26,8 +26,19 @@ import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin}
trait SparkParserUtils {
- /** Unescape backslash-escaped string enclosed by quotes. */
- def unescapeSQLString(b: String): String = {
+ /**
+ * Unescape an escaped string enclosed by quotes, with support for:
+ *   1. Quote doubling (`""` in double-quoted strings, `''` in single-quoted strings)
+ * 2. Traditional backslash escaping (\n, \t, \", etc.)
+ *
+ * @param b
+ * The input string
+ * @param ignoreQuoteQuote
+ * If true, consecutive quotes (`''` or `""`) are treated as string concatenation and will be
+ * removed directly (e.g., `'a''b'` → `ab`). If false, they are treated as escape sequences
+ * (e.g., `'a''b'` → `a'b`). Default is false (standard SQL escaping).
+ */
+ def unescapeSQLString(b: String, ignoreQuoteQuote: Boolean = false): String = {
def appendEscapedChar(n: Char, sb: JStringBuilder): Unit = {
n match {
case '0' => sb.append('\u0000')
@@ -71,10 +82,20 @@ trait SparkParserUtils {
firstChar == 'r' || firstChar == 'R'
}
+ val isDoubleQuotedString = {
+ b.charAt(0) == '"'
+ }
+
+ val isSingleQuotedString = {
+ b.charAt(0) == '\''
+ }
+
if (isRawString) {
// Skip the 'r' or 'R' and the first and last quotations enclosing the string literal.
b.substring(2, b.length - 1)
- } else if (b.indexOf('\\') == -1) {
+ } else if (b.indexOf('\\') == -1 &&
+ (!isDoubleQuotedString || b.indexOf("\"\"") == -1) &&
+ (!isSingleQuotedString || b.indexOf("''") == -1)) {
// Fast path for the common case where the string has no escaped characters,
// in which case we just skip the first and last quotations enclosing the string literal.
b.substring(1, b.length - 1)
@@ -85,7 +106,19 @@ trait SparkParserUtils {
val length = b.length - 1
while (i < length) {
val c = b.charAt(i)
- if (c != '\\' || i + 1 == length) {
+ // First check for double-quote escaping (`""`, `''`)
+ if (isDoubleQuotedString && c == '"' && i + 1 < length && b.charAt(i + 1) == '"') {
+ if (!ignoreQuoteQuote) {
+ sb.append('"')
+ }
+ i += 2
+ } else if (isSingleQuotedString && c == '\'' && i + 1 < length && b.charAt(
+ i + 1) == '\'') {
+ if (!ignoreQuoteQuote) {
+ sb.append('\'')
+ }
+ i += 2
+ } else if (c != '\\' || i + 1 == length) {
// Either a regular character or a backslash at the end of the string:
sb.append(c)
i += 1
@@ -138,6 +171,9 @@ trait SparkParserUtils {
/** Convert a string token into a string. */
def string(token: Token): String = unescapeSQLString(token.getText)
+ /** Convert a string token into a string and remove `""` and `''`. */
+ def stringIgnoreQuoteQuote(token: Token): String = unescapeSQLString(token.getText, true)
+
/** Convert a string node into a string. */
def string(node: TerminalNode): String = unescapeSQLString(node.getText)
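
Assuming a build with this change, the doubled-quote handling documented above behaves as in this sketch (SparkParserUtils is an internal trait; the wrapper object is illustrative, and the inputs include the enclosing quotes, as the parser passes them):

import org.apache.spark.sql.catalyst.util.SparkParserUtils

object UnescapeSketch extends SparkParserUtils {
  def main(args: Array[String]): Unit = {
    // Standard SQL escaping: a doubled quote collapses to a single quote.
    println(unescapeSQLString("'a''b'"))                          // a'b
    // With ignoreQuoteQuote = true the doubled quote is dropped entirely.
    println(unescapeSQLString("'a''b'", ignoreQuoteQuote = true)) // ab
  }
}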
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/StringConcat.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/StringConcat.scala
new file mode 100644
index 0000000000000..006c413d941cc
--- /dev/null
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/StringConcat.scala
@@ -0,0 +1,63 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.spark.sql.catalyst.util
+
+import org.apache.spark.unsafe.array.ByteArrayUtils
+
+/**
+ * Concatenation of sequence of strings to final string with cheap append method and one memory
+ * allocation for the final string. Can also bound the final size of the string.
+ */
+class StringConcat(val maxLength: Int = ByteArrayUtils.MAX_ROUNDED_ARRAY_LENGTH) {
+ protected val strings = new java.util.ArrayList[String]
+ protected var length: Int = 0
+
+ def atLimit: Boolean = length >= maxLength
+
+ /**
+ * Appends a string and accumulates its length to allocate a string buffer for all appended
+ * strings once in the toString method. Returns true if the string still has room for further
+ * appends before it hits its max limit.
+ */
+ def append(s: String): Unit = {
+ if (s != null) {
+ val sLen = s.length
+ if (!atLimit) {
+ val available = maxLength - length
+ val stringToAppend = if (available >= sLen) s else s.substring(0, available)
+ strings.add(stringToAppend)
+ }
+
+ // Keeps the total length of appended strings. Note that we need to cap the length at
+ // `ByteArrayUtils.MAX_ROUNDED_ARRAY_LENGTH`; otherwise, we will overflow
+ // length causing StringIndexOutOfBoundsException in the substring call above.
+ length = Math.min(length.toLong + sLen, ByteArrayUtils.MAX_ROUNDED_ARRAY_LENGTH).toInt
+ }
+ }
+
+ /**
+ * The method allocates memory for all appended strings, writes them to the memory and returns
+ * concatenated string.
+ */
+ override def toString: String = {
+ val finalLength = if (atLimit) maxLength else length
+ val result = new java.lang.StringBuilder(finalLength)
+ strings.forEach(s => result.append(s))
+ result.toString
+ }
+}
+
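
A brief usage sketch of the relocated utility (it is an internal class; the values here are illustrative):

import org.apache.spark.sql.catalyst.util.StringConcat

// Unbounded: appends are cheap, the result is materialized once in toString.
val sc = new StringConcat()
sc.append("SELECT ")
sc.append("col1, col2 ")
sc.append("FROM t")
println(sc.toString)      // SELECT col1, col2 FROM t

// Bounded: once maxLength characters are reached, further input is dropped.
val bounded = new StringConcat(maxLength = 10)
bounded.append("0123456789")
bounded.append("abcdef")
assert(bounded.atLimit && bounded.toString == "0123456789")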
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/StringUtils.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/StringUtils.scala
deleted file mode 100644
index 486093225f063..0000000000000
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/StringUtils.scala
+++ /dev/null
@@ -1,141 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-package org.apache.spark.sql.catalyst.util
-
-import java.util.HexFormat
-import java.util.concurrent.atomic.AtomicBoolean
-
-import org.apache.spark.internal.Logging
-import org.apache.spark.unsafe.array.ByteArrayUtils
-import org.apache.spark.util.ArrayImplicits._
-
-/**
- * Concatenation of sequence of strings to final string with cheap append method and one memory
- * allocation for the final string. Can also bound the final size of the string.
- */
-class StringConcat(val maxLength: Int = ByteArrayUtils.MAX_ROUNDED_ARRAY_LENGTH) {
- protected val strings = new java.util.ArrayList[String]
- protected var length: Int = 0
-
- def atLimit: Boolean = length >= maxLength
-
- /**
- * Appends a string and accumulates its length to allocate a string buffer for all appended
- * strings once in the toString method. Returns true if the string still has room for further
- * appends before it hits its max limit.
- */
- def append(s: String): Unit = {
- if (s != null) {
- val sLen = s.length
- if (!atLimit) {
- val available = maxLength - length
- val stringToAppend = if (available >= sLen) s else s.substring(0, available)
- strings.add(stringToAppend)
- }
-
- // Keeps the total length of appended strings. Note that we need to cap the length at
- // `ByteArrayMethods.MAX_ROUNDED_ARRAY_LENGTH`; otherwise, we will overflow
- // length causing StringIndexOutOfBoundsException in the substring call above.
- length = Math.min(length.toLong + sLen, ByteArrayUtils.MAX_ROUNDED_ARRAY_LENGTH).toInt
- }
- }
-
- /**
- * The method allocates memory for all appended strings, writes them to the memory and returns
- * concatenated string.
- */
- override def toString: String = {
- val finalLength = if (atLimit) maxLength else length
- val result = new java.lang.StringBuilder(finalLength)
- strings.forEach(s => result.append(s))
- result.toString
- }
-}
-
-object SparkStringUtils extends Logging {
-
- /** Whether we have warned about plan string truncation yet. */
- private val truncationWarningPrinted = new AtomicBoolean(false)
-
- /**
- * Format a sequence with semantics similar to calling .mkString(). Any elements beyond
- * `maxFields` will be dropped and replaced by a "... N more fields" placeholder.
- *
- * @return
- * the trimmed and formatted string.
- */
- def truncatedString[T](
- seq: Seq[T],
- start: String,
- sep: String,
- end: String,
- maxFields: Int,
- customToString: Option[T => String] = None): String = {
- if (seq.length > maxFields) {
- if (truncationWarningPrinted.compareAndSet(false, true)) {
- logWarning(
- "Truncated the string representation of a plan since it was too large. This " +
- s"behavior can be adjusted by setting 'spark.sql.debug.maxToStringFields'.")
- }
- val numFields = math.max(0, maxFields)
- val restNum = seq.length - numFields
- val ending = (if (numFields == 0) "" else sep) +
- (if (restNum == 0) "" else s"... $restNum more fields") + end
- if (customToString.isDefined) {
- seq.take(numFields).map(customToString.get).mkString(start, sep, ending)
- } else {
- seq.take(numFields).mkString(start, sep, ending)
- }
- } else {
- if (customToString.isDefined) {
- seq.map(customToString.get).mkString(start, sep, end)
- } else {
- seq.mkString(start, sep, end)
- }
- }
- }
-
- /** Shorthand for calling truncatedString() without start or end strings. */
- def truncatedString[T](seq: Seq[T], sep: String, maxFields: Int): String = {
- truncatedString(seq, "", sep, "", maxFields)
- }
-
- private final lazy val SPACE_DELIMITED_UPPERCASE_HEX =
- HexFormat.of().withDelimiter(" ").withUpperCase()
-
- /**
- * Returns a pretty string of the byte array which prints each byte as a hex digit and add
- * spaces between them. For example, [1A C0].
- */
- def getHexString(bytes: Array[Byte]): String = {
- s"[${SPACE_DELIMITED_UPPERCASE_HEX.formatHex(bytes)}]"
- }
-
- def sideBySide(left: String, right: String): Seq[String] = {
- sideBySide(left.split("\n").toImmutableArraySeq, right.split("\n").toImmutableArraySeq)
- }
-
- def sideBySide(left: Seq[String], right: Seq[String]): Seq[String] = {
- val maxLeftSize = left.map(_.length).max
- val leftPadded = left ++ Seq.fill(math.max(right.size - left.size, 0))("")
- val rightPadded = right ++ Seq.fill(math.max(left.size - right.size, 0))("")
-
- leftPadded.zip(rightPadded).map { case (l, r) =>
- (if (l == r) " " else "!") + l + (" " * ((maxLeftSize - l.length) + 3)) + r
- }
- }
-}
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/TimeFormatter.scala b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/TimeFormatter.scala
index 46afbc8aca196..d0438c6ff1b46 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/TimeFormatter.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/catalyst/util/TimeFormatter.scala
@@ -25,11 +25,11 @@ import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils._
import org.apache.spark.unsafe.types.UTF8String
sealed trait TimeFormatter extends Serializable {
- def parse(s: String): Long // returns microseconds since midnight
+ def parse(s: String): Long // returns nanoseconds since midnight
def format(localTime: LocalTime): String
- // Converts microseconds since the midnight to time string
- def format(micros: Long): String
+ // Converts nanoseconds since midnight to a time string
+ def format(nanos: Long): String
def validatePatternString(): Unit
}
@@ -47,15 +47,15 @@ class Iso8601TimeFormatter(pattern: String, locale: Locale, isParsing: Boolean)
override def parse(s: String): Long = {
val localTime = toLocalTime(formatter.parse(s))
- localTimeToMicros(localTime)
+ localTimeToNanos(localTime)
}
override def format(localTime: LocalTime): String = {
localTime.format(formatter)
}
- override def format(micros: Long): String = {
- format(microsToLocalTime(micros))
+ override def format(nanos: Long): String = {
+ format(nanosToLocalTime(nanos))
}
override def validatePatternString(): Unit = {
@@ -135,4 +135,8 @@ object TimeFormatter {
def apply(isParsing: Boolean): TimeFormatter = {
getFormatter(None, defaultLocale, isParsing)
}
+
+ def getFractionFormatter(): TimeFormatter = {
+ new FractionTimeFormatter()
+ }
}
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/errors/ExecutionErrors.scala b/sql/api/src/main/scala/org/apache/spark/sql/errors/ExecutionErrors.scala
index 8124b1a4ab197..1a4369b172f82 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/errors/ExecutionErrors.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/errors/ExecutionErrors.scala
@@ -24,7 +24,7 @@ import org.apache.arrow.vector.types.pojo.ArrowType
import org.apache.spark.{QueryContext, SparkArithmeticException, SparkBuildInfo, SparkDateTimeException, SparkException, SparkRuntimeException, SparkUnsupportedOperationException, SparkUpgradeException}
import org.apache.spark.sql.catalyst.WalkedTypePath
import org.apache.spark.sql.internal.SqlApiConf
-import org.apache.spark.sql.types.{DataType, DoubleType, StringType, UserDefinedType}
+import org.apache.spark.sql.types.{DataType, DoubleType, StringType}
import org.apache.spark.unsafe.types.UTF8String
private[sql] trait ExecutionErrors extends DataTypeErrorsBase {
@@ -160,13 +160,6 @@ private[sql] trait ExecutionErrors extends DataTypeErrorsBase {
messageParameters = Map("typeName" -> toSQLType(typeName)))
}
- def userDefinedTypeNotAnnotatedAndRegisteredError(udt: UserDefinedType[_]): Throwable = {
- new SparkException(
- errorClass = "_LEGACY_ERROR_TEMP_2155",
- messageParameters = Map("userClass" -> udt.userClass.getName),
- cause = null)
- }
-
def cannotFindEncoderForTypeError(typeName: String): SparkUnsupportedOperationException = {
new SparkUnsupportedOperationException(
errorClass = "ENCODER_NOT_FOUND",
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/errors/QueryParsingErrors.scala b/sql/api/src/main/scala/org/apache/spark/sql/errors/QueryParsingErrors.scala
index 12f986b89fd2b..60ccf7a9282cf 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/errors/QueryParsingErrors.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/errors/QueryParsingErrors.scala
@@ -324,7 +324,9 @@ private[sql] object QueryParsingErrors extends DataTypeErrorsBase {
ctx)
}
- def charTypeMissingLengthError(dataType: String, ctx: PrimitiveDataTypeContext): Throwable = {
+ def charVarcharTypeMissingLengthError(
+ dataType: String,
+ ctx: PrimitiveDataTypeContext): Throwable = {
new ParseException(
errorClass = "DATATYPE_MISSING_SIZE",
messageParameters = Map("type" -> toSQLType(dataType)),
@@ -333,7 +335,7 @@ private[sql] object QueryParsingErrors extends DataTypeErrorsBase {
def nestedTypeMissingElementTypeError(
dataType: String,
- ctx: PrimitiveDataTypeContext): Throwable = {
+ ctx: ComplexDataTypeContext): Throwable = {
dataType.toUpperCase(Locale.ROOT) match {
case "ARRAY" =>
new ParseException(
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/functions.scala b/sql/api/src/main/scala/org/apache/spark/sql/functions.scala
index ce5c76807b5c1..0165d8d4cf708 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/functions.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/functions.scala
@@ -871,6 +871,22 @@ object functions {
def last_value(e: Column, ignoreNulls: Column): Column =
Column.fn("last_value", e, ignoreNulls)
+ /**
+ * Create time from hour, minute and second fields. Throws an error for invalid inputs.
+ *
+ * @param hour
+ * the hour to represent, from 0 to 23
+ * @param minute
+ * the minute to represent, from 0 to 59
+ * @param second
+ * the second to represent, from 0 to 59.999999
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def make_time(hour: Column, minute: Column, second: Column): Column = {
+ Column.fn("make_time", hour, minute, second)
+ }
+
/**
* Aggregate function: returns the most frequent value in a group.
*
@@ -1376,6 +1392,36 @@ object functions {
*/
def count_if(e: Column): Column = Column.fn("count_if", e)
+ /**
+ * Returns the current time at the start of query evaluation. Note that the result will contain
+ * 6 fractional digits of seconds.
+ *
+ * @return
+ * A time.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def current_time(): Column = {
+ Column.fn("current_time")
+ }
+
+ /**
+ * Returns the current time at the start of query evaluation.
+ *
+ * @param precision
+ * An integer literal in the range [0..6], indicating how many fractional digits of seconds to
+ * include in the result.
+ * @return
+ * A time.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def current_time(precision: Int): Column = {
+ Column.fn("current_time", lit(precision))
+ }
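
A usage sketch for the new TIME builders above (not part of the patch; assumes a Spark build containing these functions and an existing SparkSession named `spark`):

import org.apache.spark.sql.functions._

// make_time builds a TIME from hour/minute/second columns; current_time()
// returns the query-start time with 6 fractional digits, current_time(3)
// with millisecond precision.
spark.range(1).select(
    make_time(lit(12), lit(34), lit(56.123456)).as("t"),
    current_time().as("now6"),
    current_time(3).as("now3"))
  .show(truncate = false)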
+
/**
* Aggregate function: computes a histogram on numeric 'expr' using nb bins. The return value is
* an array of (x,y) pairs representing the centers of the histogram's bins. As the value of
@@ -5400,7 +5446,7 @@ object functions {
def dayofyear(e: Column): Column = Column.fn("dayofyear", e)
/**
- * Extracts the hours as an integer from a given date/timestamp/string.
+ * Extracts the hours as an integer from a given date/time/timestamp/string.
* @return
* An integer, or null if the input was a string that could not be cast to a date
* @group datetime_funcs
@@ -5473,7 +5519,7 @@ object functions {
def last_day(e: Column): Column = Column.fn("last_day", e)
/**
- * Extracts the minutes as an integer from a given date/timestamp/string.
+ * Extracts the minutes as an integer from a given date/time/timestamp/string.
* @return
* An integer, or null if the input was a string that could not be cast to a date
* @group datetime_funcs
@@ -5579,7 +5625,7 @@ object functions {
Column.fn("next_day", date, dayOfWeek)
/**
- * Extracts the seconds as an integer from a given date/timestamp/string.
+ * Extracts the seconds as an integer from a given date/time/timestamp/string.
* @return
* An integer, or null if the input was a string that could not be cast to a timestamp
* @group datetime_funcs
@@ -5683,6 +5729,41 @@ object functions {
def unix_timestamp(s: Column, p: String): Column =
Column.fn("unix_timestamp", s, lit(p))
+ /**
+ * Parses a string value to a time value.
+ *
+ * @param str
+ * A string to be parsed to time.
+ * @return
+ * A time, or raises an error if the input is malformed.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def to_time(str: Column): Column = {
+ Column.fn("to_time", str)
+ }
+
+ /**
+ * Parses a string value to a time value.
+ *
+ * See <a href="https://spark.apache.org/docs/latest/sql-ref-datetime-pattern.html"> Datetime
+ * Patterns</a> for valid time format patterns.
+ *
+ * @param str
+ * A string to be parsed to time.
+ * @param format
+ * A time format pattern to follow.
+ * @return
+ * A time, or raises an error if the input is malformed.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def to_time(str: Column, format: Column): Column = {
+ Column.fn("to_time", str, format)
+ }
+
/**
* Converts to a timestamp by casting rules to `TimestampType`.
*
@@ -5715,6 +5796,41 @@ object functions {
*/
def to_timestamp(s: Column, fmt: String): Column = Column.fn("to_timestamp", s, lit(fmt))
+ /**
+ * Parses a string value to a time value.
+ *
+ * @param str
+ * A string to be parsed to time.
+ * @return
+ * A time, or null if the input is malformed.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def try_to_time(str: Column): Column = {
+ Column.fn("try_to_time", str)
+ }
+
+ /**
+ * Parses a string value to a time value.
+ *
+ * See <a href="https://spark.apache.org/docs/latest/sql-ref-datetime-pattern.html"> Datetime
+ * Patterns</a> for valid time format patterns.
+ *
+ * @param str
+ * A string to be parsed to time.
+ * @param format
+ * A time format pattern to follow.
+ * @return
+ * A time, or null if the input is malformed.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def try_to_time(str: Column, format: Column): Column = {
+ Column.fn("try_to_time", str, format)
+ }
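
A parsing sketch for to_time / try_to_time (same assumptions as the earlier sketch: a build containing this change and an existing `spark` session):

import org.apache.spark.sql.functions._

// to_time raises an error on malformed input; try_to_time returns NULL instead.
spark.sql("SELECT '12:34:56' AS s, 'oops' AS bad")
  .select(
    to_time(col("s")).as("t"),                        // parsed with the default pattern
    try_to_time(col("s"), lit("HH:mm:ss")).as("t2"),  // explicit format pattern
    try_to_time(col("bad")).as("t3"))                 // NULL: the input is malformed
  .show()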
+
/**
* Parses the `s` with the `format` to a timestamp. The function always returns null on an
* invalid input with`/`without ANSI SQL mode enabled. The result data type is consistent with
@@ -5763,6 +5879,24 @@ object functions {
*/
def to_date(e: Column, fmt: String): Column = Column.fn("to_date", e, lit(fmt))
+ /**
+ * This is a special version of `to_date` that performs the same operation, but returns a NULL
+ * value instead of raising an error if the date cannot be created.
+ *
+ * @group datetime_funcs
+ * @since 4.0.0
+ */
+ def try_to_date(e: Column): Column = Column.fn("try_to_date", e)
+
+ /**
+ * This is a special version of `to_date` that performs the same operation, but returns a NULL
+ * value instead of raising an error if the date cannot be created.
+ *
+ * @group datetime_funcs
+ * @since 4.0.0
+ */
+ def try_to_date(e: Column, fmt: String): Column = Column.fn("try_to_date", e, lit(fmt))
+
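
A corresponding sketch for try_to_date (hedged the same way):

import org.apache.spark.sql.functions._

// try_to_date mirrors to_date but yields NULL instead of an error on bad input.
spark.sql("SELECT '2025-01-31' AS ok, 'not a date' AS bad")
  .select(try_to_date(col("ok")), try_to_date(col("bad"), "yyyy-MM-dd"))
  .show()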
/**
* Returns the number of days since 1970-01-01.
*
@@ -6158,6 +6292,49 @@ object functions {
def timestamp_add(unit: String, quantity: Column, ts: Column): Column =
Column.internalFn("timestampadd", lit(unit), quantity, ts)
+ /**
+ * Returns the difference between two times, measured in the specified unit. Throws a
+ * SparkIllegalArgumentException if the specified unit is not supported.
+ *
+ * @param unit
+ * A STRING representing the unit of the time difference. Supported units are: "HOUR",
+ * "MINUTE", "SECOND", "MILLISECOND", and "MICROSECOND". The unit is case-insensitive.
+ * @param start
+ * A starting TIME.
+ * @param end
+ * An ending TIME.
+ * @return
+ * The difference between `end` and `start` times, measured in the specified unit.
+ * @note
+ * If any of the inputs is `NULL`, the result is `NULL`.
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def time_diff(unit: Column, start: Column, end: Column): Column = {
+ Column.fn("time_diff", unit, start, end)
+ }
+
+ /**
+ * Returns `time` truncated to the `unit`.
+ *
+ * @param unit
+ * A STRING representing the unit to truncate the time to. Supported units are: "HOUR",
+ * "MINUTE", "SECOND", "MILLISECOND", and "MICROSECOND". The unit is case-insensitive.
+ * @param time
+ * A TIME to truncate.
+ * @return
+ * A TIME truncated to the specified unit.
+ * @note
+ * If any of the inputs is `NULL`, the result is `NULL`.
+ * @throws IllegalArgumentException
+ * If the `unit` is not supported.
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def time_trunc(unit: Column, time: Column): Column = {
+ Column.fn("time_trunc", unit, time)
+ }
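
A sketch for the two TIME helpers above (same assumptions as the earlier sketches):

import org.apache.spark.sql.functions._

// Build two TIME values, then measure their difference and truncate one of them.
val times = spark.range(1).select(
  make_time(lit(9), lit(15), lit(30.123456)).as("t1"),
  make_time(lit(10), lit(45), lit(0)).as("t2"))
times.select(
    time_diff(lit("MINUTE"), col("t1"), col("t2")).as("diff_minutes"),
    time_trunc(lit("HOUR"), col("t1")).as("t1_hour"))
  .show(truncate = false)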
+
/**
* Parses the `timestamp` expression with the `format` expression to a timestamp without time
* zone. Returns null with invalid input.
@@ -8464,6 +8641,15 @@ object functions {
secs: Column): Column =
Column.fn("make_timestamp_ntz", years, months, days, hours, mins, secs)
+ /**
+ * Create a local date-time from date and time fields.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def make_timestamp_ntz(date: Column, time: Column): Column =
+ Column.fn("make_timestamp_ntz", date, time)
+
/**
* Try to create a local date-time from years, months, days, hours, mins, secs fields. The
* function returns NULL on invalid inputs.
@@ -8480,6 +8666,15 @@ object functions {
secs: Column): Column =
Column.fn("try_make_timestamp_ntz", years, months, days, hours, mins, secs)
+ /**
+ * Try to create a local date-time from date and time fields.
+ *
+ * @group datetime_funcs
+ * @since 4.1.0
+ */
+ def try_make_timestamp_ntz(date: Column, time: Column): Column =
+ Column.fn("try_make_timestamp_ntz", date, time)
+
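
A sketch combining a DATE and a TIME into a timestamp without time zone (same assumptions as above):

import org.apache.spark.sql.functions._

// make_timestamp_ntz(date, time) glues the two parts together; the try_ variant
// returns NULL instead of failing on invalid inputs.
spark.range(1).select(
    make_timestamp_ntz(
      to_date(lit("2025-06-01")),
      make_time(lit(23), lit(59), lit(59.5))).as("ts_ntz"))
  .show(truncate = false)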
/**
* Make year-month interval from years, months.
*
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConf.scala b/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConf.scala
index 76449f1704d26..3ab9b312feea8 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConf.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConf.scala
@@ -47,6 +47,9 @@ private[sql] trait SqlApiConf {
def stackTracesInDataFrameContext: Int
def dataFrameQueryContextEnabled: Boolean
def legacyAllowUntypedScalaUDFs: Boolean
+ def manageParserCaches: Boolean
+ def parserDfaCacheFlushThreshold: Int
+ def parserDfaCacheFlushRatio: Double
}
private[sql] object SqlApiConf {
@@ -60,6 +63,11 @@ private[sql] object SqlApiConf {
val LOCAL_RELATION_CACHE_THRESHOLD_KEY: String = {
SqlApiConfHelper.LOCAL_RELATION_CACHE_THRESHOLD_KEY
}
+ val PARSER_DFA_CACHE_FLUSH_THRESHOLD_KEY: String =
+ SqlApiConfHelper.PARSER_DFA_CACHE_FLUSH_THRESHOLD_KEY
+ val PARSER_DFA_CACHE_FLUSH_RATIO_KEY: String =
+ SqlApiConfHelper.PARSER_DFA_CACHE_FLUSH_RATIO_KEY
+ val MANAGE_PARSER_CACHES_KEY: String = SqlApiConfHelper.MANAGE_PARSER_CACHES_KEY
def get: SqlApiConf = SqlApiConfHelper.getConfGetter.get()()
@@ -88,4 +96,7 @@ private[sql] object DefaultSqlApiConf extends SqlApiConf {
override def stackTracesInDataFrameContext: Int = 1
override def dataFrameQueryContextEnabled: Boolean = true
override def legacyAllowUntypedScalaUDFs: Boolean = false
+ override def manageParserCaches: Boolean = false
+ override def parserDfaCacheFlushThreshold: Int = -1
+ override def parserDfaCacheFlushRatio: Double = -1.0
}
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConfHelper.scala b/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConfHelper.scala
index dace1dbaecfa5..727620bd5bd03 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConfHelper.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/internal/SqlApiConfHelper.scala
@@ -33,6 +33,10 @@ private[sql] object SqlApiConfHelper {
val SESSION_LOCAL_TIMEZONE_KEY: String = "spark.sql.session.timeZone"
val LOCAL_RELATION_CACHE_THRESHOLD_KEY: String = "spark.sql.session.localRelationCacheThreshold"
val ARROW_EXECUTION_USE_LARGE_VAR_TYPES = "spark.sql.execution.arrow.useLargeVarTypes"
+ val PARSER_DFA_CACHE_FLUSH_THRESHOLD_KEY: String =
+ "spark.sql.parser.parserDfaCacheFlushThreshold"
+ val PARSER_DFA_CACHE_FLUSH_RATIO_KEY: String = "spark.sql.parser.parserDfaCacheFlushRatio"
+ val MANAGE_PARSER_CACHES_KEY: String = "spark.sql.parser.manageParserCaches"
val confGetter: AtomicReference[() => SqlApiConf] = {
new AtomicReference[() => SqlApiConf](() => DefaultSqlApiConf)
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/AbstractDataType.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/AbstractDataType.scala
index 9590fb23e16b1..a87482e88139f 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/AbstractDataType.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/AbstractDataType.scala
@@ -175,3 +175,17 @@ private[spark] object AnsiIntervalType extends AbstractDataType {
override private[sql] def defaultConcreteType: DataType = DayTimeIntervalType()
}
+
+/**
+ * A TIME type of any valid precision.
+ */
+private[sql] abstract class AnyTimeType extends DatetimeType
+
+private[spark] object AnyTimeType extends AbstractDataType with Serializable {
+ override private[sql] def simpleString: String = "time"
+
+ override private[sql] def acceptsType(other: DataType): Boolean =
+ other.isInstanceOf[AnyTimeType]
+
+ override private[sql] def defaultConcreteType: DataType = TimeType(TimeType.DEFAULT_PRECISION)
+}
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/DataType.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/DataType.scala
index f798276d60f7c..3ecc84a1578a4 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/DataType.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/DataType.scala
@@ -126,6 +126,7 @@ object DataType {
private val FIXED_DECIMAL = """decimal\(\s*(\d+)\s*,\s*(\-?\d+)\s*\)""".r
private val CHAR_TYPE = """char\(\s*(\d+)\s*\)""".r
private val VARCHAR_TYPE = """varchar\(\s*(\d+)\s*\)""".r
+ private val STRING_WITH_COLLATION = """string\s+collate\s+(\w+)""".r
val COLLATIONS_METADATA_KEY = "__COLLATIONS"
@@ -215,6 +216,7 @@ object DataType {
case FIXED_DECIMAL(precision, scale) => DecimalType(precision.toInt, scale.toInt)
case CHAR_TYPE(length) => CharType(length.toInt)
case VARCHAR_TYPE(length) => VarcharType(length.toInt)
+ case STRING_WITH_COLLATION(collation) => StringType(collation)
// For backwards compatibility, previously the type name of NullType is "null"
case "null" => NullType
case "timestamp_ltz" => TimestampType
@@ -234,11 +236,15 @@ object DataType {
}
}
+ private[sql] def parseDataType(json: JValue): DataType = {
+ parseDataType(json, fieldPath = "", collationsMap = Map.empty)
+ }
+
// NOTE: Map fields must be sorted in alphabetical order to keep consistent with the Python side.
private[sql] def parseDataType(
json: JValue,
- fieldPath: String = "",
- collationsMap: Map[String, String] = Map.empty): DataType = json match {
+ fieldPath: String,
+ collationsMap: Map[String, String]): DataType = json match {
case JString(name) =>
collationsMap.get(fieldPath) match {
case Some(collation) =>
@@ -442,15 +448,41 @@ object DataType {
}
/**
- * Check if `from` is equal to `to` type except for collations, which are checked to be
- * compatible so that data of type `from` can be interpreted as of type `to`.
+ * Compares two data types, ignoring compatible collation of StringType. If `checkComplexTypes`
+ * is true, it will also ignore collations for nested types.
*/
- private[sql] def equalsIgnoreCompatibleCollation(from: DataType, to: DataType): Boolean = {
- (from, to) match {
- // String types with possibly different collations are compatible.
- case (a: StringType, b: StringType) => a.constraint == b.constraint
+ private[sql] def equalsIgnoreCompatibleCollation(
+ from: DataType,
+ to: DataType,
+ checkComplexTypes: Boolean = true): Boolean = {
+ def transform: PartialFunction[DataType, DataType] = {
+ case dt @ (_: CharType | _: VarcharType) => dt
+ case _: StringType => StringType
+ // SPARK-53330 (see below)
+ case _: DayTimeIntervalType => DayTimeIntervalType.DEFAULT
+ }
- case (fromDataType, toDataType) => fromDataType == toDataType
+ if (checkComplexTypes) {
+ from.transformRecursively(transform) == to.transformRecursively(transform)
+ } else {
+ (from, to) match {
+ case (a: StringType, b: StringType) => a.constraint == b.constraint
+ // SPARK-53330: Arrow serialization always returns DayTimeIntervalType(0, 3)
+ // as it has the maximum range, we can always assume that we can match
+ // with the target type.
+ case (_: DayTimeIntervalType, _: DayTimeIntervalType) => true
+
+ case (fromDataType, toDataType) => fromDataType == toDataType
+ }
+ }
+ }
+
+ private[sql] def equalsIgnoreCompatibleCollation(
+ from: Seq[DataType],
+ to: Seq[DataType]): Boolean = {
+ from.length == to.length &&
+ from.zip(to).forall { case (fromDataType, toDataType) =>
+ equalsIgnoreCompatibleCollation(fromDataType, toDataType)
}
}
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/Metadata.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/Metadata.scala
index 8d7bcbac8af16..f2cfcb984594d 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/Metadata.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/Metadata.scala
@@ -40,13 +40,15 @@ import org.apache.spark.util.ArrayImplicits._
* @since 1.3.0
*/
@Stable
-sealed class Metadata private[types] (
- private[types] val map: Map[String, Any],
- @transient private[types] val runtimeMap: Map[String, Any])
+@SerialVersionUID(-3987058932362209243L)
+sealed class Metadata private[types] (private[types] val map: Map[String, Any])
extends Serializable {
+ @transient private[types] var runtimeMap: Map[String, Any] = _
+ private[types] def setRuntimeMap(map: Map[String, Any]): Unit = runtimeMap = map
+
/** No-arg constructor for kryo. */
- protected def this() = this(null, null)
+ protected def this() = this(null)
/** Tests whether this Metadata contains a binding for a key. */
def contains(key: String): Boolean = map.contains(key)
@@ -137,7 +139,7 @@ sealed class Metadata private[types] (
@Stable
object Metadata {
- private[this] val _empty = new Metadata(Map.empty, Map.empty)
+ private[this] val _empty = new Metadata(Map.empty)
/** Returns an empty Metadata. */
def empty: Metadata = _empty
@@ -305,7 +307,16 @@ class MetadataBuilder {
/** Builds the [[Metadata]] instance. */
def build(): Metadata = {
- new Metadata(map.toMap, runtimeMap.toMap)
+ if (map.isEmpty && runtimeMap.isEmpty) {
+ // Save some memory when the metadata is empty
+ Metadata.empty
+ } else {
+ val metadata = new Metadata(map.toMap)
+ if (runtimeMap.nonEmpty) {
+ metadata.setRuntimeMap(runtimeMap.toMap)
+ }
+ metadata
+ }
}
private def put(key: String, value: Any): this.type = {
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/StringType.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/StringType.scala
index 5fec578b03581..787730f775084 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/StringType.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/StringType.scala
@@ -17,8 +17,6 @@
package org.apache.spark.sql.types
-import org.json4s.JsonAST.{JString, JValue}
-
import org.apache.spark.annotation.Stable
import org.apache.spark.sql.catalyst.util.CollationFactory
import org.apache.spark.sql.internal.SqlApiConf
@@ -90,11 +88,6 @@ class StringType private[sql] (
private[sql] def collationName: String =
CollationFactory.fetchCollation(collationId).collationName
- // Due to backwards compatibility and compatibility with other readers
- // all string types are serialized in json as regular strings and
- // the collation information is written to struct field metadata
- override def jsonValue: JValue = JString("string")
-
override def equals(obj: Any): Boolean = {
obj match {
case s: StringType => s.collationId == collationId && s.constraint == constraint
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/StructField.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/StructField.scala
index 4c51980d4e6c4..eb3d30051880a 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/StructField.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/StructField.scala
@@ -70,11 +70,30 @@ case class StructField(
private[sql] def jsonValue: JValue = {
("name" -> name) ~
- ("type" -> dataType.jsonValue) ~
+ ("type" -> dataTypeJsonValue) ~
("nullable" -> nullable) ~
("metadata" -> metadataJson)
}
+ private[sql] def dataTypeJsonValue: JValue = {
+ if (collationMetadata.isEmpty) return dataType.jsonValue
+
+ def removeCollations(dt: DataType): DataType = dt match {
+ // Only recurse into map and array types as any child struct type
+ // will have already been processed.
+ case ArrayType(et, nullable) =>
+ ArrayType(removeCollations(et), nullable)
+ case MapType(kt, vt, nullable) =>
+ MapType(removeCollations(kt), removeCollations(vt), nullable)
+ case st: StringType => StringHelper.removeCollation(st)
+ case _ => dt
+ }
+
+ // As we want to be backwards compatible we should remove all collations information from the
+ // json and only keep that information in the metadata.
+ removeCollations(dataType).jsonValue
+ }
+
private def metadataJson: JValue = {
val metadataJsonValue = metadata.jsonValue
metadataJsonValue match {
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/StructType.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/StructType.scala
index 4c49d3a58f4fc..5b1d9f1f116a5 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/StructType.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/StructType.scala
@@ -30,11 +30,11 @@ import org.apache.spark.annotation.Stable
import org.apache.spark.sql.catalyst.analysis.SqlApiAnalysis
import org.apache.spark.sql.catalyst.parser.{DataTypeParser, LegacyTypeStringParser}
import org.apache.spark.sql.catalyst.trees.Origin
-import org.apache.spark.sql.catalyst.util.{CaseInsensitiveMap, SparkStringUtils, StringConcat}
+import org.apache.spark.sql.catalyst.util.{CaseInsensitiveMap, StringConcat}
import org.apache.spark.sql.errors.DataTypeErrors
import org.apache.spark.sql.errors.DataTypeErrors.toSQLId
import org.apache.spark.sql.internal.SqlApiConf
-import org.apache.spark.util.SparkCollectionUtils
+import org.apache.spark.util.{SparkCollectionUtils, SparkStringUtils}
/**
* A [[StructType]] object can be constructed by
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/TimeType.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/TimeType.scala
index c42311c6a1dcc..135ad278438ed 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/TimeType.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/TimeType.scala
@@ -31,7 +31,7 @@ import org.apache.spark.sql.errors.DataTypeErrors
* @since 4.1.0
*/
@Unstable
-case class TimeType(precision: Int) extends DatetimeType {
+case class TimeType(precision: Int) extends AnyTimeType {
if (precision < TimeType.MIN_PRECISION || precision > TimeType.MAX_PRECISION) {
throw DataTypeErrors.unsupportedTimePrecisionError(precision)
@@ -51,6 +51,8 @@ object TimeType {
val MIN_PRECISION: Int = 0
val MICROS_PRECISION: Int = 6
val MAX_PRECISION: Int = MICROS_PRECISION
+ val DEFAULT_PRECISION: Int = MICROS_PRECISION
+ val NANOS_PRECISION: Int = 9
- def apply(): TimeType = new TimeType(MICROS_PRECISION)
+ def apply(): TimeType = new TimeType(DEFAULT_PRECISION)
}
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/UDTRegistration.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/UDTRegistration.scala
index 85d421a07577b..7bc9bde65c19b 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/UDTRegistration.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/UDTRegistration.scala
@@ -20,7 +20,7 @@ package org.apache.spark.sql.types
import scala.collection.mutable
import org.apache.spark.annotation.{DeveloperApi, Since}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.errors.DataTypeErrors
import org.apache.spark.util.SparkClassUtils
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/types/UserDefinedType.scala b/sql/api/src/main/scala/org/apache/spark/sql/types/UserDefinedType.scala
index dd8ca26c52462..3d3521d88fdf5 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/types/UserDefinedType.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/types/UserDefinedType.scala
@@ -94,6 +94,22 @@ abstract class UserDefinedType[UserType >: Null] extends DataType with Serializa
}
override def catalogString: String = sqlType.simpleString
+
+ /**
+ * This method is used to convert the value of a UDT to a string representation.
+ *
+ * By default, it simply calls `toString` on the object.
+ *
+ * @param obj
+ * The object to convert to a string.
+ * @return
+ * A string representation of the object.
+ * @since 4.1.0
+ */
+ @Since("4.1.0")
+ def stringifyValue(obj: Any): String = {
+ obj.toString
+ }
}
private[spark] object UserDefinedType {
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/util/ArrowUtils.scala b/sql/api/src/main/scala/org/apache/spark/sql/util/ArrowUtils.scala
index 587ca43e57300..6caabf20f8f6b 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/util/ArrowUtils.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/util/ArrowUtils.scala
@@ -58,6 +58,7 @@ private[sql] object ArrowUtils {
case TimestampType => new ArrowType.Timestamp(TimeUnit.MICROSECOND, timeZoneId)
case TimestampNTZType =>
new ArrowType.Timestamp(TimeUnit.MICROSECOND, null)
+ case _: TimeType => new ArrowType.Time(TimeUnit.NANOSECOND, 8 * 8)
case NullType => ArrowType.Null.INSTANCE
case _: YearMonthIntervalType => new ArrowType.Interval(IntervalUnit.YEAR_MONTH)
case _: DayTimeIntervalType => new ArrowType.Duration(TimeUnit.MICROSECOND)
@@ -88,6 +89,8 @@ private[sql] object ArrowUtils {
if ts.getUnit == TimeUnit.MICROSECOND && ts.getTimezone == null =>
TimestampNTZType
case ts: ArrowType.Timestamp if ts.getUnit == TimeUnit.MICROSECOND => TimestampType
+ case t: ArrowType.Time if t.getUnit == TimeUnit.NANOSECOND && t.getBitWidth == 8 * 8 =>
+ TimeType(TimeType.MICROS_PRECISION)
case ArrowType.Null.INSTANCE => NullType
case yi: ArrowType.Interval if yi.getUnit == IntervalUnit.YEAR_MONTH =>
YearMonthIntervalType()
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/util/ArtifactUtils.scala b/sql/api/src/main/scala/org/apache/spark/sql/util/ArtifactUtils.scala
index 8cd239b55cff0..0fc14b4c8b460 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/util/ArtifactUtils.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/util/ArtifactUtils.scala
@@ -19,6 +19,8 @@ package org.apache.spark.sql.util
import java.nio.file.{Path, Paths}
+import org.apache.spark.SparkRuntimeException
+
object ArtifactUtils {
private[sql] def concatenatePaths(basePath: Path, otherPath: Path): Path = {
@@ -40,4 +42,18 @@ object ArtifactUtils {
private[sql] def concatenatePaths(basePath: Path, otherPath: String): Path = {
concatenatePaths(basePath, Paths.get(otherPath))
}
+
+ /**
+ * Converts a sequence of exceptions into a single exception by adding all but the first
+ * exceptions as suppressed exceptions to the first one.
+ * @param exceptions
+ * @return
+ */
+ private[sql] def mergeExceptionsWithSuppressed(
+ exceptions: Seq[SparkRuntimeException]): SparkRuntimeException = {
+ require(exceptions.nonEmpty)
+ val mainException = exceptions.head
+ exceptions.drop(1).foreach(mainException.addSuppressed)
+ mainException
+ }
}
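
The helper above follows the standard suppressed-exception pattern; a runnable sketch against plain RuntimeExceptions (hypothetical names, outside Spark internals):

def mergeWithSuppressed(exceptions: Seq[RuntimeException]): RuntimeException = {
  require(exceptions.nonEmpty)
  val main = exceptions.head
  exceptions.drop(1).foreach(main.addSuppressed) // attach the rest to the first
  main
}

val merged = mergeWithSuppressed(Seq(
  new RuntimeException("first failure"),
  new RuntimeException("second failure")))
assert(merged.getSuppressed.length == 1)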
diff --git a/sql/api/src/main/scala/org/apache/spark/sql/util/ProtobufUtils.scala b/sql/api/src/main/scala/org/apache/spark/sql/util/ProtobufUtils.scala
index 11f35ceb060c0..be56e3cf13133 100644
--- a/sql/api/src/main/scala/org/apache/spark/sql/util/ProtobufUtils.scala
+++ b/sql/api/src/main/scala/org/apache/spark/sql/util/ProtobufUtils.scala
@@ -18,18 +18,16 @@
package org.apache.spark.sql.util
import java.io.{File, FileNotFoundException}
-import java.nio.file.NoSuchFileException
+import java.nio.file.{Files, NoSuchFileException}
import scala.util.control.NonFatal
-import org.apache.commons.io.FileUtils
-
import org.apache.spark.sql.errors.CompilationErrors
object ProtobufUtils {
def readDescriptorFileContent(filePath: String): Array[Byte] = {
try {
- FileUtils.readFileToByteArray(new File(filePath))
+ Files.readAllBytes(new File(filePath).toPath())
} catch {
case ex: FileNotFoundException =>
throw CompilationErrors.cannotFindDescriptorFileError(filePath, ex)
diff --git a/sql/catalyst/benchmarks/CalendarIntervalBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/CalendarIntervalBenchmark-jdk21-results.txt
index 01fcb4c21cb28..6daa0f267ff51 100644
--- a/sql/catalyst/benchmarks/CalendarIntervalBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/CalendarIntervalBenchmark-jdk21-results.txt
@@ -2,10 +2,10 @@
CalendarInterval
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
CalendarInterval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Call setInterval & getInterval 1032 1033 1 130.0 7.7 1.0X
+Call setInterval & getInterval 1034 1034 0 129.9 7.7 1.0X
diff --git a/sql/catalyst/benchmarks/CalendarIntervalBenchmark-results.txt b/sql/catalyst/benchmarks/CalendarIntervalBenchmark-results.txt
index 1f828510aa2ab..88548550e418d 100644
--- a/sql/catalyst/benchmarks/CalendarIntervalBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/CalendarIntervalBenchmark-results.txt
@@ -2,10 +2,10 @@
CalendarInterval
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
CalendarInterval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Call setInterval & getInterval 1051 1053 2 127.7 7.8 1.0X
+Call setInterval & getInterval 1037 1038 2 129.4 7.7 1.0X
diff --git a/sql/catalyst/benchmarks/EnumTypeSetBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/EnumTypeSetBenchmark-jdk21-results.txt
index 42b473742f2f1..54be9abdb59d7 100644
--- a/sql/catalyst/benchmarks/EnumTypeSetBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/EnumTypeSetBenchmark-jdk21-results.txt
@@ -1,105 +1,105 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use empty Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 1 1 0 1389.0 0.7 1.0X
-Use EnumSet 2 2 0 560.9 1.8 0.4X
+Use HashSet 1 1 0 1390.4 0.7 1.0X
+Use EnumSet 2 2 0 414.9 2.4 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 1 item Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 2 2 0 424.0 2.4 1.0X
-Use EnumSet 2 2 0 571.0 1.8 1.3X
+Use HashSet 2 2 0 489.8 2.0 1.0X
+Use EnumSet 2 2 0 507.3 2.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 3 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 2 3 0 413.2 2.4 1.0X
-Use EnumSet 2 2 0 601.3 1.7 1.5X
+Use HashSet 2 2 0 490.2 2.0 1.0X
+Use EnumSet 2 2 0 562.4 1.8 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 5 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 9 9 0 109.4 9.1 1.0X
-Use EnumSet 2 2 0 550.6 1.8 5.0X
+Use HashSet 9 9 0 116.1 8.6 1.0X
+Use EnumSet 2 2 0 532.6 1.9 4.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 10 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 10 10 0 99.7 10.0 1.0X
-Use EnumSet 2 2 0 550.7 1.8 5.5X
+Use HashSet 10 10 0 105.0 9.5 1.0X
+Use EnumSet 2 2 0 532.4 1.9 5.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create empty Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 0 0 0 413.1 2.4 1.0X
-Use EnumSet 0 0 0 291.1 3.4 0.7X
+Use HashSet 0 0 0 412.3 2.4 1.0X
+Use EnumSet 0 0 0 291.5 3.4 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 1 item Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 1 1 0 102.3 9.8 1.0X
-Use EnumSet 0 0 0 290.9 3.4 2.8X
+Use HashSet 1 1 0 102.6 9.7 1.0X
+Use EnumSet 0 0 0 294.4 3.4 2.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 3 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 9 10 0 10.6 94.7 1.0X
-Use EnumSet 1 1 0 132.0 7.6 12.5X
+Use HashSet 10 10 0 10.2 98.5 1.0X
+Use EnumSet 1 1 0 132.6 7.5 13.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 5 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 35 36 1 2.8 354.1 1.0X
-Use EnumSet 1 1 0 144.5 6.9 51.2X
+Use HashSet 32 33 0 3.1 323.4 1.0X
+Use EnumSet 1 1 0 144.8 6.9 46.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 10 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 57 57 0 1.8 569.8 1.0X
-Use EnumSet 1 1 0 138.3 7.2 78.8X
+Use HashSet 57 57 1 1.8 568.2 1.0X
+Use EnumSet 1 1 0 138.5 7.2 78.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use empty Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 4 4 0 267.5 3.7 1.0X
-Use EnumSet 5 5 0 198.5 5.0 0.7X
+Use HashSet 4 4 0 226.1 4.4 1.0X
+Use EnumSet 6 6 0 176.0 5.7 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 1 item Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 12 13 0 85.1 11.8 1.0X
-Use EnumSet 6 6 0 160.1 6.2 1.9X
+Use HashSet 13 14 0 74.3 13.5 1.0X
+Use EnumSet 7 7 0 149.4 6.7 2.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 3 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 26 27 0 38.4 26.1 1.0X
-Use EnumSet 6 6 0 163.7 6.1 4.3X
+Use HashSet 27 27 0 37.2 26.9 1.0X
+Use EnumSet 6 7 0 154.6 6.5 4.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 5 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 51 51 1 19.7 50.8 1.0X
-Use EnumSet 6 6 0 160.4 6.2 8.1X
+Use HashSet 54 54 0 18.6 53.7 1.0X
+Use EnumSet 7 7 0 152.2 6.6 8.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 10 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Use HashSet 78 79 0 12.8 78.1 1.0X
-Use EnumSet 7 7 0 149.0 6.7 11.6X
+Use HashSet 77 78 1 12.9 77.5 1.0X
+Use EnumSet 7 7 0 150.8 6.6 11.7X
diff --git a/sql/catalyst/benchmarks/EnumTypeSetBenchmark-results.txt b/sql/catalyst/benchmarks/EnumTypeSetBenchmark-results.txt
index a63a191f4e2d6..69baaea7f6e5d 100644
--- a/sql/catalyst/benchmarks/EnumTypeSetBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/EnumTypeSetBenchmark-results.txt
@@ -1,105 +1,105 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use empty Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 1 1 0 1446.7 0.7 1.0X
-Use EnumSet 2 2 0 498.8 2.0 0.3X
+Use HashSet 1 1 0 1452.7 0.7 1.0X
+Use EnumSet 2 2 0 561.7 1.8 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 1 item Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 2 2 0 495.9 2.0 1.0X
-Use EnumSet 2 2 0 491.3 2.0 1.0X
+Use HashSet 2 2 0 506.0 2.0 1.0X
+Use EnumSet 2 2 0 483.6 2.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 3 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 2 2 0 488.0 2.0 1.0X
-Use EnumSet 2 2 0 552.0 1.8 1.1X
+Use HashSet 2 2 0 542.0 1.8 1.0X
+Use EnumSet 2 2 0 577.9 1.7 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 5 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 9 9 0 108.3 9.2 1.0X
-Use EnumSet 2 2 0 533.8 1.9 4.9X
+Use HashSet 8 8 0 121.7 8.2 1.0X
+Use EnumSet 2 2 0 540.7 1.8 4.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test contains use 10 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 10 10 0 103.2 9.7 1.0X
-Use EnumSet 2 2 0 534.3 1.9 5.2X
+Use HashSet 9 9 0 109.4 9.1 1.0X
+Use EnumSet 2 2 0 541.0 1.8 4.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create empty Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 0 0 0 414.2 2.4 1.0X
-Use EnumSet 1 1 0 132.4 7.6 0.3X
+Use HashSet 0 0 0 413.0 2.4 1.0X
+Use EnumSet 1 1 0 132.1 7.6 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 1 item Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 2 2 0 58.9 17.0 1.0X
-Use EnumSet 1 1 0 135.5 7.4 2.3X
+Use HashSet 1 1 0 98.2 10.2 1.0X
+Use EnumSet 0 0 0 209.7 4.8 2.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 3 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 9 9 0 11.0 90.9 1.0X
-Use EnumSet 1 1 0 137.6 7.3 12.5X
+Use HashSet 9 10 1 11.2 89.6 1.0X
+Use EnumSet 1 1 0 150.4 6.6 13.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 5 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 34 35 1 2.9 341.5 1.0X
-Use EnumSet 1 1 0 137.4 7.3 46.9X
+Use HashSet 31 31 0 3.3 306.4 1.0X
+Use EnumSet 1 1 0 150.6 6.6 46.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create 10 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 58 58 1 1.7 576.3 1.0X
-Use EnumSet 1 1 0 131.3 7.6 75.7X
+Use HashSet 58 58 1 1.7 576.1 1.0X
+Use EnumSet 1 1 0 138.2 7.2 79.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use empty Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 4 4 0 251.0 4.0 1.0X
-Use EnumSet 5 5 0 190.6 5.2 0.8X
+Use HashSet 4 4 0 234.2 4.3 1.0X
+Use EnumSet 6 6 0 181.0 5.5 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 1 item Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 11 12 0 87.1 11.5 1.0X
-Use EnumSet 6 7 0 157.5 6.4 1.8X
+Use HashSet 10 11 0 96.0 10.4 1.0X
+Use EnumSet 7 7 0 150.9 6.6 1.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 3 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 29 29 0 34.9 28.6 1.0X
-Use EnumSet 6 6 0 157.4 6.4 4.5X
+Use HashSet 28 29 0 35.3 28.3 1.0X
+Use EnumSet 7 7 0 150.9 6.6 4.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 5 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Use HashSet 55 56 1 18.1 55.4 1.0X
-Use EnumSet 6 7 0 154.3 6.5 8.5X
+Use HashSet 53 54 0 18.8 53.3 1.0X
+Use EnumSet 7 7 0 148.8 6.7 7.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test create and contains use 10 items Set: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Use HashSet 81 82 1 12.4 80.8 1.0X
-Use EnumSet 7 7 0 153.7 6.5 12.4X
+Use HashSet 78 79 1 12.8 78.0 1.0X
+Use EnumSet 7 7 0 147.4 6.8 11.5X
diff --git a/sql/catalyst/benchmarks/EscapePathBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/EscapePathBenchmark-jdk21-results.txt
index 471fea1fbd045..680c21beb2f52 100644
--- a/sql/catalyst/benchmarks/EscapePathBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/EscapePathBenchmark-jdk21-results.txt
@@ -2,23 +2,23 @@
Escape
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Escape Tests: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Legacy 6403 6417 22 0.2 6403.1 1.0X
-New 792 822 11 1.3 791.5 8.1X
+Legacy 7201 7208 5 0.1 7200.9 1.0X
+New 809 811 2 1.2 809.0 8.9X
================================================================================================
Unescape
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Unescape Tests: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Legacy 5057 5069 11 0.2 5057.1 1.0X
-New 589 592 3 1.7 588.7 8.6X
+Legacy 5298 5304 7 0.2 5297.6 1.0X
+New 591 598 4 1.7 591.3 9.0X
diff --git a/sql/catalyst/benchmarks/EscapePathBenchmark-results.txt b/sql/catalyst/benchmarks/EscapePathBenchmark-results.txt
index 9dc0f68498fed..0297bd37455e2 100644
--- a/sql/catalyst/benchmarks/EscapePathBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/EscapePathBenchmark-results.txt
@@ -2,23 +2,23 @@
Escape
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Escape Tests: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Legacy 6776 6787 13 0.1 6776.1 1.0X
-New 680 682 1 1.5 680.5 10.0X
+Legacy 6814 6819 4 0.1 6814.3 1.0X
+New 688 719 11 1.5 687.6 9.9X
================================================================================================
Unescape
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Unescape Tests: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Legacy 6899 6912 13 0.1 6898.6 1.0X
-New 592 598 7 1.7 592.3 11.6X
+Legacy 6008 6016 5 0.2 6008.2 1.0X
+New 593 599 6 1.7 593.1 10.1X
diff --git a/sql/catalyst/benchmarks/GenericArrayDataBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/GenericArrayDataBenchmark-jdk21-results.txt
index 2c9329b736de5..38c290b69c5f2 100644
--- a/sql/catalyst/benchmarks/GenericArrayDataBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/GenericArrayDataBenchmark-jdk21-results.txt
@@ -1,10 +1,10 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
constructor: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-arrayOfAny 6 6 0 1611.5 0.6 1.0X
-arrayOfAnyAsObject 6 6 0 1611.6 0.6 1.0X
-arrayOfAnyAsSeq 173 175 3 57.7 17.3 0.0X
-arrayOfInt 271 272 0 36.8 27.1 0.0X
-arrayOfIntAsObject 251 252 1 39.8 25.1 0.0X
+arrayOfAny 6 6 0 1611.7 0.6 1.0X
+arrayOfAnyAsObject 6 6 0 1611.8 0.6 1.0X
+arrayOfAnyAsSeq 174 175 1 57.5 17.4 0.0X
+arrayOfInt 393 395 1 25.4 39.3 0.0X
+arrayOfIntAsObject 419 419 1 23.9 41.9 0.0X
diff --git a/sql/catalyst/benchmarks/GenericArrayDataBenchmark-results.txt b/sql/catalyst/benchmarks/GenericArrayDataBenchmark-results.txt
index 19dc9e88757be..7ee0bb288eb73 100644
--- a/sql/catalyst/benchmarks/GenericArrayDataBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/GenericArrayDataBenchmark-results.txt
@@ -1,10 +1,10 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
constructor: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-arrayOfAny 6 6 0 1611.5 0.6 1.0X
-arrayOfAnyAsObject 6 6 0 1611.4 0.6 1.0X
-arrayOfAnyAsSeq 158 160 1 63.1 15.8 0.0X
-arrayOfInt 254 255 1 39.4 25.4 0.0X
-arrayOfIntAsObject 254 256 3 39.4 25.4 0.0X
+arrayOfAny 6 6 0 1611.8 0.6 1.0X
+arrayOfAnyAsObject 6 6 0 1611.8 0.6 1.0X
+arrayOfAnyAsSeq 158 159 1 63.4 15.8 0.0X
+arrayOfInt 258 259 1 38.8 25.8 0.0X
+arrayOfIntAsObject 258 258 0 38.8 25.8 0.0X
diff --git a/sql/catalyst/benchmarks/HashBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/HashBenchmark-jdk21-results.txt
index 08fcb7d351e26..8175c4c7120db 100644
--- a/sql/catalyst/benchmarks/HashBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/HashBenchmark-jdk21-results.txt
@@ -2,69 +2,69 @@
single ints
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For single ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 2093 2095 3 256.5 3.9 1.0X
-codegen version 3536 3540 6 151.8 6.6 0.6X
-codegen version 64-bit 3124 3124 1 171.9 5.8 0.7X
-codegen HiveHash version 2560 2561 2 209.7 4.8 0.8X
+interpreted version 2095 2098 4 256.2 3.9 1.0X
+codegen version 3534 3537 5 151.9 6.6 0.6X
+codegen version 64-bit 3123 3127 5 171.9 5.8 0.7X
+codegen HiveHash version 2563 2569 8 209.4 4.8 0.8X
================================================================================================
single longs
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For single longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 2707 2710 4 198.3 5.0 1.0X
-codegen version 4519 4520 2 118.8 8.4 0.6X
-codegen version 64-bit 3833 3842 13 140.0 7.1 0.7X
-codegen HiveHash version 3138 3145 9 171.1 5.8 0.9X
+interpreted version 2712 2713 1 197.9 5.1 1.0X
+codegen version 4518 4521 4 118.8 8.4 0.6X
+codegen version 64-bit 3658 3659 0 146.8 6.8 0.7X
+codegen HiveHash version 3139 3140 2 171.0 5.8 0.9X
================================================================================================
normal
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For normal: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 1414 1415 2 1.5 674.3 1.0X
-codegen version 1905 1906 1 1.1 908.5 0.7X
-codegen version 64-bit 749 753 3 2.8 357.3 1.9X
-codegen HiveHash version 3833 3837 5 0.5 1827.9 0.4X
+interpreted version 1342 1344 3 1.6 640.1 1.0X
+codegen version 1858 1860 2 1.1 886.2 0.7X
+codegen version 64-bit 731 731 1 2.9 348.4 1.8X
+codegen HiveHash version 3704 3706 2 0.6 1766.4 0.4X
================================================================================================
array
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 1081 1083 2 0.1 8249.1 1.0X
-codegen version 3788 3788 1 0.0 28896.9 0.3X
-codegen version 64-bit 2596 2601 6 0.1 19805.4 0.4X
-codegen HiveHash version 761 762 2 0.2 5807.2 1.4X
+interpreted version 965 966 1 0.1 7363.6 1.0X
+codegen version 3439 3440 1 0.0 26238.1 0.3X
+codegen version 64-bit 2363 2364 1 0.1 18030.0 0.4X
+codegen HiveHash version 695 696 1 0.2 5304.0 1.4X
================================================================================================
map
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For map: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 0 0 0 91.2 11.0 1.0X
-codegen version 260 263 3 0.0 63355.0 0.0X
-codegen version 64-bit 177 179 3 0.0 43169.7 0.0X
-codegen HiveHash version 29 29 0 0.1 7041.8 0.0X
+interpreted version 0 0 0 85.0 11.8 1.0X
+codegen version 236 236 0 0.0 57574.4 0.0X
+codegen version 64-bit 161 161 0 0.0 39306.9 0.0X
+codegen HiveHash version 26 26 0 0.2 6395.2 0.0X
diff --git a/sql/catalyst/benchmarks/HashBenchmark-results.txt b/sql/catalyst/benchmarks/HashBenchmark-results.txt
index b1dbc78213bca..8aa274e1a510a 100644
--- a/sql/catalyst/benchmarks/HashBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/HashBenchmark-results.txt
@@ -2,69 +2,69 @@
single ints
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For single ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 2179 2180 1 246.4 4.1 1.0X
-codegen version 3670 3678 11 146.3 6.8 0.6X
-codegen version 64-bit 3423 3426 4 156.8 6.4 0.6X
-codegen HiveHash version 2864 2865 1 187.5 5.3 0.8X
+interpreted version 2174 2177 4 246.9 4.0 1.0X
+codegen version 3672 3675 4 146.2 6.8 0.6X
+codegen version 64-bit 3423 3427 5 156.8 6.4 0.6X
+codegen HiveHash version 2857 2857 1 187.9 5.3 0.8X
================================================================================================
single longs
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For single longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 3019 3021 3 177.8 5.6 1.0X
-codegen version 5477 5480 4 98.0 10.2 0.6X
-codegen version 64-bit 3755 3759 5 143.0 7.0 0.8X
-codegen HiveHash version 3319 3326 9 161.7 6.2 0.9X
+interpreted version 3018 3019 2 177.9 5.6 1.0X
+codegen version 5238 5240 2 102.5 9.8 0.6X
+codegen version 64-bit 3762 3765 4 142.7 7.0 0.8X
+codegen HiveHash version 3342 3342 0 160.6 6.2 0.9X
================================================================================================
normal
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For normal: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 2487 2488 1 0.8 1186.0 1.0X
-codegen version 2253 2255 2 0.9 1074.5 1.1X
-codegen version 64-bit 705 705 1 3.0 336.0 3.5X
-codegen HiveHash version 3671 3675 6 0.6 1750.3 0.7X
+interpreted version 2617 2618 2 0.8 1248.0 1.0X
+codegen version 2296 2296 0 0.9 1094.8 1.1X
+codegen version 64-bit 704 706 1 3.0 335.9 3.7X
+codegen HiveHash version 3782 3786 5 0.6 1803.6 0.7X
================================================================================================
array
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 1042 1045 4 0.1 7947.6 1.0X
-codegen version 3728 3735 10 0.0 28442.1 0.3X
-codegen version 64-bit 2487 2499 18 0.1 18971.5 0.4X
-codegen HiveHash version 775 776 1 0.2 5910.2 1.3X
+interpreted version 1015 1021 8 0.1 7747.0 1.0X
+codegen version 3673 3676 4 0.0 28025.1 0.3X
+codegen version 64-bit 2453 2454 1 0.1 18717.5 0.4X
+codegen HiveHash version 781 782 1 0.2 5961.0 1.3X
================================================================================================
map
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash For map: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-interpreted version 0 0 0 97.0 10.3 1.0X
-codegen version 262 262 1 0.0 63915.5 0.0X
-codegen version 64-bit 177 177 0 0.0 43098.3 0.0X
-codegen HiveHash version 29 29 1 0.1 7091.4 0.0X
+interpreted version 0 0 0 97.3 10.3 1.0X
+codegen version 256 256 0 0.0 62469.7 0.0X
+codegen version 64-bit 181 182 1 0.0 44237.6 0.0X
+codegen HiveHash version 30 30 0 0.1 7329.7 0.0X
diff --git a/sql/catalyst/benchmarks/HashByteArrayBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/HashByteArrayBenchmark-jdk21-results.txt
index 7c326a530dcf9..e5a5f508343eb 100644
--- a/sql/catalyst/benchmarks/HashByteArrayBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/HashByteArrayBenchmark-jdk21-results.txt
@@ -2,76 +2,76 @@
Benchmark for MurMurHash 3 and xxHash64
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 8: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 10 10 0 206.4 4.8 1.0X
-xxHash 64-bit 10 10 0 200.7 5.0 1.0X
-HiveHasher 14 14 0 151.5 6.6 0.7X
+Murmur3_x86_32 11 11 0 196.5 5.1 1.0X
+xxHash 64-bit 11 11 0 199.5 5.0 1.0X
+HiveHasher 14 14 1 150.9 6.6 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 16: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
Murmur3_x86_32 14 15 0 145.5 6.9 1.0X
-xxHash 64-bit 12 13 0 168.0 6.0 1.2X
-HiveHasher 23 23 0 90.8 11.0 0.6X
+xxHash 64-bit 13 13 0 167.2 6.0 1.1X
+HiveHasher 23 23 0 91.0 11.0 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 24: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
Murmur3_x86_32 20 20 0 104.3 9.6 1.0X
-xxHash 64-bit 14 15 0 144.9 6.9 1.4X
-HiveHasher 33 33 0 62.7 15.9 0.6X
+xxHash 64-bit 14 15 0 144.8 6.9 1.4X
+HiveHasher 33 34 1 62.7 15.9 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 31: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 35 35 0 60.6 16.5 1.0X
-xxHash 64-bit 27 27 0 76.9 13.0 1.3X
-HiveHasher 44 44 1 48.2 20.8 0.8X
+Murmur3_x86_32 32 32 0 65.5 15.3 1.0X
+xxHash 64-bit 27 27 0 76.9 13.0 1.2X
+HiveHasher 44 44 0 48.2 20.8 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 95: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 82 82 1 25.5 39.1 1.0X
-xxHash 64-bit 57 58 0 36.5 27.4 1.4X
-HiveHasher 157 157 0 13.4 74.8 0.5X
+Murmur3_x86_32 70 71 0 29.8 33.6 1.0X
+xxHash 64-bit 57 58 0 36.5 27.4 1.2X
+HiveHasher 157 157 0 13.4 74.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 287: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 224 224 0 9.4 106.6 1.0X
-xxHash 64-bit 102 102 0 20.6 48.4 2.2X
-HiveHasher 532 534 1 3.9 253.9 0.4X
+Murmur3_x86_32 197 198 0 10.6 94.1 1.0X
+xxHash 64-bit 102 102 0 20.6 48.6 1.9X
+HiveHasher 532 533 0 3.9 253.9 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 1055: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 803 803 0 2.6 382.7 1.0X
-xxHash 64-bit 294 294 1 7.1 140.1 2.7X
-HiveHasher 2043 2044 0 1.0 974.4 0.4X
+Murmur3_x86_32 710 711 1 3.0 338.6 1.0X
+xxHash 64-bit 293 293 0 7.2 139.7 2.4X
+HiveHasher 2042 2043 0 1.0 973.8 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 2079: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 1597 1597 0 1.3 761.3 1.0X
-xxHash 64-bit 550 551 0 3.8 262.4 2.9X
-HiveHasher 4047 4047 0 0.5 1929.6 0.4X
+Murmur3_x86_32 1387 1387 0 1.5 661.3 1.0X
+xxHash 64-bit 550 550 0 3.8 262.1 2.5X
+HiveHasher 4047 4048 0 0.5 1929.9 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 8223: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 6287 6290 4 0.3 2997.9 1.0X
-xxHash 64-bit 2071 2071 0 1.0 987.4 3.0X
-HiveHasher 16084 16086 3 0.1 7669.3 0.4X
+Murmur3_x86_32 5727 5729 2 0.4 2730.9 1.0X
+xxHash 64-bit 2066 2066 1 1.0 985.1 2.8X
+HiveHasher 16085 16086 1 0.1 7669.9 0.4X
diff --git a/sql/catalyst/benchmarks/HashByteArrayBenchmark-results.txt b/sql/catalyst/benchmarks/HashByteArrayBenchmark-results.txt
index 45b4e8ac70025..a7e8c45f4f42e 100644
--- a/sql/catalyst/benchmarks/HashByteArrayBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/HashByteArrayBenchmark-results.txt
@@ -2,76 +2,76 @@
Benchmark for MurMurHash 3 and xxHash64
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 8: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 11 11 0 183.1 5.5 1.0X
+Murmur3_x86_32 11 12 0 183.1 5.5 1.0X
xxHash 64-bit 10 10 0 213.5 4.7 1.2X
-HiveHasher 14 14 0 150.0 6.7 0.8X
+HiveHasher 14 14 0 149.9 6.7 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 16: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 17 17 0 123.2 8.1 1.0X
-xxHash 64-bit 12 12 0 175.4 5.7 1.4X
+Murmur3_x86_32 17 17 0 122.9 8.1 1.0X
+xxHash 64-bit 12 12 0 175.2 5.7 1.4X
HiveHasher 23 23 0 93.0 10.8 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 24: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 24 24 2 89.1 11.2 1.0X
-xxHash 64-bit 14 14 0 145.3 6.9 1.6X
-HiveHasher 33 34 2 63.0 15.9 0.7X
+Murmur3_x86_32 24 24 0 89.1 11.2 1.0X
+xxHash 64-bit 14 15 0 145.1 6.9 1.6X
+HiveHasher 33 33 0 63.0 15.9 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 31: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 37 37 0 56.2 17.8 1.0X
-xxHash 64-bit 27 28 0 76.4 13.1 1.4X
-HiveHasher 43 43 0 49.2 20.3 0.9X
+Murmur3_x86_32 36 36 0 57.9 17.3 1.0X
+xxHash 64-bit 28 28 0 75.5 13.2 1.3X
+HiveHasher 43 43 0 49.2 20.3 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 95: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 88 88 0 23.9 41.8 1.0X
-xxHash 64-bit 64 64 0 32.9 30.4 1.4X
-HiveHasher 158 160 4 13.2 75.6 0.6X
+Murmur3_x86_32 87 87 0 24.0 41.6 1.0X
+xxHash 64-bit 65 65 0 32.5 30.8 1.3X
+HiveHasher 158 159 0 13.2 75.5 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 287: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 244 244 0 8.6 116.5 1.0X
-xxHash 64-bit 123 123 0 17.1 58.5 2.0X
+Murmur3_x86_32 244 244 0 8.6 116.4 1.0X
+xxHash 64-bit 124 125 1 16.9 59.2 2.0X
HiveHasher 534 534 0 3.9 254.8 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 1055: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 878 878 0 2.4 418.7 1.0X
-xxHash 64-bit 401 402 1 5.2 191.1 2.2X
-HiveHasher 2044 2044 0 1.0 974.7 0.4X
+Murmur3_x86_32 879 879 0 2.4 418.9 1.0X
+xxHash 64-bit 401 401 0 5.2 191.2 2.2X
+HiveHasher 2045 2045 0 1.0 975.0 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 2079: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 1718 1724 9 1.2 819.2 1.0X
-xxHash 64-bit 781 781 0 2.7 372.4 2.2X
-HiveHasher 4050 4052 3 0.5 1931.4 0.4X
+Murmur3_x86_32 1714 1715 0 1.2 817.5 1.0X
+xxHash 64-bit 783 784 1 2.7 373.5 2.2X
+HiveHasher 4050 4051 1 0.5 1931.4 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Hash byte arrays with length 8223: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Murmur3_x86_32 6746 6747 2 0.3 3216.6 1.0X
-xxHash 64-bit 3042 3044 2 0.7 1450.7 2.2X
-HiveHasher 16080 16081 3 0.1 7667.3 0.4X
+Murmur3_x86_32 6745 6745 0 0.3 3216.1 1.0X
+xxHash 64-bit 3046 3046 0 0.7 1452.4 2.2X
+HiveHasher 16085 16086 2 0.1 7669.9 0.4X
diff --git a/sql/catalyst/benchmarks/HexBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/HexBenchmark-jdk21-results.txt
index afad7d3f6c6f4..238fe92dd9593 100644
--- a/sql/catalyst/benchmarks/HexBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/HexBenchmark-jdk21-results.txt
@@ -2,13 +2,13 @@
UnHex Comparison
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Cardinality 1000000: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Common Codecs 4735 4800 106 0.2 4734.6 1.0X
-Java 4008 4011 3 0.2 4008.3 1.2X
-Spark 3493 3519 44 0.3 3492.8 1.4X
-Spark Binary 2641 2648 11 0.4 2641.3 1.8X
+Common Codecs 4701 4786 118 0.2 4700.5 1.0X
+Java 3962 3969 10 0.3 3962.4 1.2X
+Spark 3492 3494 2 0.3 3491.6 1.3X
+Spark Binary 2638 2638 0 0.4 2637.8 1.8X
diff --git a/sql/catalyst/benchmarks/HexBenchmark-results.txt b/sql/catalyst/benchmarks/HexBenchmark-results.txt
index ebb1fb05aef2c..796f48468187d 100644
--- a/sql/catalyst/benchmarks/HexBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/HexBenchmark-results.txt
@@ -2,13 +2,13 @@
UnHex Comparison
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Cardinality 1000000: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Common Codecs 4537 4561 21 0.2 4536.8 1.0X
-Java 3137 3142 6 0.3 3137.5 1.4X
-Spark 3793 3799 6 0.3 3793.3 1.2X
-Spark Binary 2755 2758 2 0.4 2755.5 1.6X
+Common Codecs 4821 4894 64 0.2 4820.6 1.0X
+Java 2565 2572 10 0.4 2564.8 1.9X
+Spark 3811 3812 1 0.3 3810.7 1.3X
+Spark Binary 2758 2759 1 0.4 2757.9 1.7X
diff --git a/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-jdk21-results.txt
index 754895dda89b4..2ae65e2b4a716 100644
--- a/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-jdk21-results.txt
@@ -1,7 +1,7 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
internal row comparable wrapper: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-toSet 100 103 3 2.0 499.8 1.0X
-mergePartitions 181 184 3 1.1 907.3 0.6X
+toSet 81 84 2 2.5 406.5 1.0X
+mergePartitions 139 141 2 1.4 695.7 0.6X
diff --git a/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-results.txt b/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-results.txt
index ebb7cb08939ed..6ce0c60a96565 100644
--- a/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/InternalRowComparableWrapperBenchmark-results.txt
@@ -1,7 +1,7 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
internal row comparable wrapper: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-toSet 116 118 2 1.7 581.5 1.0X
-mergePartitions 208 211 3 1.0 1040.8 0.6X
+toSet 114 117 3 1.8 568.6 1.0X
+mergePartitions 212 213 1 0.9 1059.5 0.5X
diff --git a/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-jdk21-results.txt b/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-jdk21-results.txt
index 7cf3689a033d6..e20ffc3ffec3a 100644
--- a/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-jdk21-results.txt
+++ b/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-jdk21-results.txt
@@ -2,13 +2,13 @@
unsafe projection
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
unsafe projection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-single long 1331 1333 2 201.6 5.0 1.0X
-single nullable long 2369 2380 16 113.3 8.8 0.6X
-7 primitive types 7127 7128 2 37.7 26.5 0.2X
-7 nullable primitive types 10678 10678 0 25.1 39.8 0.1X
+single long 1331 1332 1 201.7 5.0 1.0X
+single nullable long 2369 2412 61 113.3 8.8 0.6X
+7 primitive types 7149 7154 8 37.5 26.6 0.2X
+7 nullable primitive types 10649 10652 4 25.2 39.7 0.1X
diff --git a/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-results.txt b/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-results.txt
index b2f82a851689f..b1c8e9a375809 100644
--- a/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-results.txt
+++ b/sql/catalyst/benchmarks/UnsafeProjectionBenchmark-results.txt
@@ -2,13 +2,13 @@
unsafe projection
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
unsafe projection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-single long 1376 1377 2 195.1 5.1 1.0X
-single nullable long 2447 2449 3 109.7 9.1 0.6X
-7 primitive types 7004 7011 10 38.3 26.1 0.2X
-7 nullable primitive types 10357 10363 7 25.9 38.6 0.1X
+single long 1377 1378 0 194.9 5.1 1.0X
+single nullable long 2385 2420 50 112.5 8.9 0.6X
+7 primitive types 7018 7019 2 38.3 26.1 0.2X
+7 nullable primitive types 10399 10400 1 25.8 38.7 0.1X
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/ArrayOfDecimalsSerDe.java b/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/ArrayOfDecimalsSerDe.java
new file mode 100644
index 0000000000000..3a445fea56906
--- /dev/null
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/ArrayOfDecimalsSerDe.java
@@ -0,0 +1,259 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.expressions;
+
+import java.math.BigDecimal;
+import java.math.BigInteger;
+import java.util.Objects;
+
+import org.apache.datasketches.common.ArrayOfItemsSerDe;
+import org.apache.datasketches.common.ArrayOfLongsSerDe;
+import org.apache.datasketches.common.ArrayOfNumbersSerDe;
+import org.apache.datasketches.common.Util;
+import org.apache.datasketches.memory.Memory;
+
+import org.apache.spark.sql.types.Decimal;
+import org.apache.spark.sql.types.DecimalType;
+
+import static org.apache.datasketches.common.ByteArrayUtil.copyBytes;
+import static org.apache.datasketches.common.ByteArrayUtil.putIntLE;
+
+public class ArrayOfDecimalsSerDe extends ArrayOfItemsSerDe<Decimal> {
+
+ private final int precision;
+ private final int scale;
+ private final DecimalType decimalType;
+ private final ArrayOfItemsSerDe<?> delegate;
+
+ public ArrayOfDecimalsSerDe(DecimalType decimalType) {
+ this.decimalType = decimalType;
+ this.precision = decimalType.precision();
+ this.scale = decimalType.scale();
+
+ if (DecimalType.is32BitDecimalType(decimalType)) {
+ this.delegate = new ArrayOfNumbersSerDe();
+ } else if (DecimalType.is64BitDecimalType(decimalType)) {
+ this.delegate = new ArrayOfLongsSerDe();
+ } else {
+ this.delegate = new ArrayOfDecimalByteArrSerDe(decimalType);
+ }
+ }
+
+ @Override
+ public byte[] serializeToByteArray(Decimal item) {
+ Objects.requireNonNull(item, "Item must not be null");
+ if (DecimalType.is32BitDecimalType(decimalType)) {
+ return ((ArrayOfNumbersSerDe) delegate).serializeToByteArray(decimalToInt(item));
+ } else if (DecimalType.is64BitDecimalType(decimalType)) {
+ return ((ArrayOfLongsSerDe) delegate).serializeToByteArray(item.toUnscaledLong());
+ } else {
+ return ((ArrayOfDecimalByteArrSerDe) delegate).serializeToByteArray(item);
+ }
+ }
+
+ @Override
+ public byte[] serializeToByteArray(Decimal[] items) {
+ Objects.requireNonNull(items, "Item must not be null");
+ if (DecimalType.is32BitDecimalType(decimalType)) {
+ Number[] intItems = new Number[items.length];
+ for (int i = 0; i < items.length; i++) {
+ intItems[i] = decimalToInt(items[i]);
+ }
+ return ((ArrayOfNumbersSerDe) delegate).serializeToByteArray(intItems);
+ } else if (DecimalType.is64BitDecimalType(decimalType)) {
+ Long[] longItems = new Long[items.length];
+ for (int i = 0; i < items.length; i++) {
+ longItems[i] = items[i].toUnscaledLong();
+ }
+ return ((ArrayOfLongsSerDe) delegate).serializeToByteArray(longItems);
+ } else {
+ return ((ArrayOfDecimalByteArrSerDe) delegate).serializeToByteArray(items);
+ }
+ }
+
+ @Override
+ public Decimal[] deserializeFromMemory(Memory mem, long offsetBytes, int numItems) {
+ Objects.requireNonNull(mem, "Memory must not be null");
+ if (DecimalType.is32BitDecimalType(decimalType)) {
+ Number[] intArray = ((ArrayOfNumbersSerDe) delegate)
+ .deserializeFromMemory(mem, offsetBytes, numItems);
+ Decimal[] result = new Decimal[intArray.length];
+ for (int i = 0; i < intArray.length; i++) {
+ result[i] = Decimal.createUnsafe((int) intArray[i], precision, scale);
+ }
+ return result;
+ } else if (DecimalType.is64BitDecimalType(decimalType)) {
+ Long[] longArray = ((ArrayOfLongsSerDe) delegate)
+ .deserializeFromMemory(mem, offsetBytes, numItems);
+ Decimal[] result = new Decimal[longArray.length];
+ for (int i = 0; i < longArray.length; i++) {
+ result[i] = Decimal.createUnsafe(longArray[i], precision, scale);
+ }
+ return result;
+ } else {
+ return ((ArrayOfDecimalByteArrSerDe) delegate)
+ .deserializeFromMemory(mem, offsetBytes, numItems);
+ }
+ }
+
+ @Override
+ public int sizeOf(Decimal item) {
+ Objects.requireNonNull(item, "Item must not be null");
+ if (DecimalType.is32BitDecimalType(decimalType)) {
+ return ((ArrayOfNumbersSerDe) delegate).sizeOf(decimalToInt(item));
+ } else if (DecimalType.is64BitDecimalType(decimalType)) {
+ return ((ArrayOfLongsSerDe) delegate).sizeOf(item.toUnscaledLong());
+ } else {
+ return ((ArrayOfDecimalByteArrSerDe) delegate).sizeOf(item);
+ }
+ }
+
+ @Override
+ public int sizeOf(Memory mem, long offsetBytes, int numItems) {
+ Objects.requireNonNull(mem, "Memory must not be null");
+ return delegate.sizeOf(mem, offsetBytes, numItems);
+ }
+
+ @Override
+ public String toString(Decimal item) {
+ if (item == null) {
+ return "null";
+ }
+ return item.toString();
+ }
+
+ @Override
+ public Class<Decimal> getClassOfT() {
+ return Decimal.class;
+ }
+
+ private int decimalToInt(Decimal item) {
+ return ((int) item.toUnscaledLong());
+ }
+
+
+ /**
+ * Serialize and deserialize Decimal as byte array.
+ */
+ private static class ArrayOfDecimalByteArrSerDe extends ArrayOfItemsSerDe<Decimal> {
+ private final int precision;
+ private final int scale;
+
+ ArrayOfDecimalByteArrSerDe(DecimalType decimalType) {
+ assert DecimalType.isByteArrayDecimalType(decimalType);
+ this.precision = decimalType.precision();
+ this.scale = decimalType.scale();
+ }
+
+ @Override
+ public byte[] serializeToByteArray(Decimal item) {
+ Objects.requireNonNull(item, "Item must not be null");
+ final byte[] decimalByteArr = item.toJavaBigDecimal().unscaledValue().toByteArray();
+ final int numBytes = decimalByteArr.length;
+ final byte[] out = new byte[numBytes + Integer.BYTES];
+ copyBytes(decimalByteArr, 0, out, 4, numBytes);
+ putIntLE(out, 0, numBytes);
+ return out;
+ }
+
+ @Override
+ public byte[] serializeToByteArray(Decimal[] items) {
+ Objects.requireNonNull(items, "Items must not be null");
+ if (items.length == 0) {
+ return new byte[0];
+ }
+ int totalBytes = 0;
+ final int numItems = items.length;
+ final byte[][] serialized2DArray = new byte[numItems][];
+ for (int i = 0; i < numItems; i++) {
+ serialized2DArray[i] = items[i].toJavaBigDecimal().unscaledValue().toByteArray();
+ totalBytes += serialized2DArray[i].length + Integer.BYTES;
+ }
+ final byte[] bytesOut = new byte[totalBytes];
+ int offset = 0;
+ for (int i = 0; i < numItems; i++) {
+ final int decimalLen = serialized2DArray[i].length;
+ putIntLE(bytesOut, offset, decimalLen);
+ offset += Integer.BYTES;
+ copyBytes(serialized2DArray[i], 0, bytesOut, offset, decimalLen);
+ offset += decimalLen;
+ }
+ return bytesOut;
+ }
+
+ @Override
+ public Decimal[] deserializeFromMemory(Memory mem, long offsetBytes, int numItems) {
+ Objects.requireNonNull(mem, "Memory must not be null");
+ if (numItems <= 0) {
+ return new Decimal[0];
+ }
+ final Decimal[] array = new Decimal[numItems];
+ long offset = offsetBytes;
+ for (int i = 0; i < numItems; i++) {
+ Util.checkBounds(offset, Integer.BYTES, mem.getCapacity());
+ final int decimalLength = mem.getInt(offset);
+ offset += Integer.BYTES;
+ final byte[] decimalBytes = new byte[decimalLength];
+ Util.checkBounds(offset, decimalLength, mem.getCapacity());
+ mem.getByteArray(offset, decimalBytes, 0, decimalLength);
+ offset += decimalLength;
+ BigInteger bigInteger = new BigInteger(decimalBytes);
+ BigDecimal javaDecimal = new BigDecimal(bigInteger, scale);
+ array[i] = Decimal.apply(javaDecimal, precision, scale);
+ }
+ return array;
+ }
+
+ @Override
+ public int sizeOf(Decimal item) {
+ Objects.requireNonNull(item, "Item must not be null");
+ return item.toJavaBigDecimal().unscaledValue().toByteArray().length + Integer.BYTES;
+ }
+
+ @Override
+ public int sizeOf(Memory mem, long offsetBytes, int numItems) {
+ Objects.requireNonNull(mem, "Memory must not be null");
+ if (numItems <= 0) {
+ return 0;
+ }
+ long offset = offsetBytes;
+ final long memCap = mem.getCapacity();
+ for (int i = 0; i < numItems; i++) {
+ Util.checkBounds(offset, Integer.BYTES, memCap);
+ final int itemLenBytes = mem.getInt(offset);
+ offset += Integer.BYTES;
+ Util.checkBounds(offset, itemLenBytes, memCap);
+ offset += itemLenBytes;
+ }
+ return (int) (offset - offsetBytes);
+ }
+
+ @Override
+ public String toString(Decimal item) {
+ if (item == null) {
+ return "null";
+ }
+ return item.toString();
+ }
+
+ @Override
+ public Class<Decimal> getClassOfT() {
+ return Decimal.class;
+ }
+ }
+}
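The new SerDe follows the DataSketches ArrayOfItemsSerDe contract, so it can back any sketch that stores Decimal items. Below is a hedged, hypothetical round-trip (the driver class, sample values, and the choice of the frequencies ItemsSketch are illustrative assumptions, not part of the patch), using a DecimalType(10, 2), which takes the 64-bit long code path:

import java.math.BigDecimal;
import org.apache.datasketches.frequencies.ItemsSketch;
import org.apache.datasketches.memory.Memory;
import org.apache.spark.sql.catalyst.expressions.ArrayOfDecimalsSerDe;
import org.apache.spark.sql.types.Decimal;
import org.apache.spark.sql.types.DecimalType;

public class DecimalSerDeRoundTrip {
  public static void main(String[] args) {
    // DecimalType(10, 2) is 64-bit backed, so the SerDe delegates to ArrayOfLongsSerDe
    DecimalType type = new DecimalType(10, 2);
    ArrayOfDecimalsSerDe serDe = new ArrayOfDecimalsSerDe(type);

    ItemsSketch<Decimal> sketch = new ItemsSketch<>(64);  // maxMapSize must be a power of 2
    sketch.update(Decimal.apply(new BigDecimal("12.34"), 10, 2));
    sketch.update(Decimal.apply(new BigDecimal("56.78"), 10, 2));

    // Serialize the sketch (exercises serializeToByteArray(Decimal[])) and restore it
    byte[] bytes = sketch.toByteArray(serDe);
    ItemsSketch<Decimal> restored = ItemsSketch.getInstance(Memory.wrap(bytes), serDe);
    System.out.println(restored.getNumActiveItems());  // 2
  }
}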
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/RowBasedKeyValueBatch.java b/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/RowBasedKeyValueBatch.java
index 5074348a1fd6a..4a041b70cf592 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/RowBasedKeyValueBatch.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/catalyst/expressions/RowBasedKeyValueBatch.java
@@ -129,7 +129,7 @@ private boolean acquirePage(long requiredSize) {
page = allocatePage(requiredSize);
} catch (SparkOutOfMemoryError e) {
logger.warn("Failed to allocate page ({} bytes).",
- MDC.of(LogKeys.PAGE_SIZE$.MODULE$, requiredSize));
+ MDC.of(LogKeys.PAGE_SIZE, requiredSize));
return false;
}
base = page.getBaseObject();
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/Table.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/Table.java
index f9a75ccd1c8da..3a1e0d9f7011e 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/Table.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/Table.java
@@ -20,6 +20,7 @@
import org.apache.spark.annotation.Evolving;
import org.apache.spark.sql.connector.catalog.constraints.Constraint;
import org.apache.spark.sql.connector.expressions.Transform;
+import org.apache.spark.sql.errors.QueryCompilationErrors;
import org.apache.spark.sql.types.StructType;
import java.util.Collections;
@@ -56,7 +57,9 @@ public interface Table {
* @deprecated This is deprecated. Please override {@link #columns} instead.
*/
@Deprecated(since = "3.4.0")
- StructType schema();
+ default StructType schema() {
+ throw QueryCompilationErrors.mustOverrideOneMethodError("columns");
+ }
/**
* Returns the columns of this table. If the table is not readable and doesn't have a schema, an
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableCapability.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableCapability.java
index 5732c0f3af4ee..0a01c0c266b9a 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableCapability.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableCapability.java
@@ -93,6 +93,12 @@ public enum TableCapability {
*/
ACCEPT_ANY_SCHEMA,
+ /**
+ * Signals that table supports Spark altering the schema if necessary
+ * as part of an operation.
+ */
+ AUTOMATIC_SCHEMA_EVOLUTION,
+
/**
* Signals that the table supports append writes using the V1 InsertableRelation interface.
*
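Combined with the default schema() added to Table above, a connector table no longer has to implement schema() at all and can advertise the new capability. A minimal, hypothetical sketch (EventsTable and its columns are illustrative, not from the patch):

import java.util.EnumSet;
import java.util.Set;
import org.apache.spark.sql.connector.catalog.Column;
import org.apache.spark.sql.connector.catalog.Table;
import org.apache.spark.sql.connector.catalog.TableCapability;
import org.apache.spark.sql.types.DataTypes;

class EventsTable implements Table {
  @Override
  public String name() {
    return "events";
  }

  // The inherited default schema() throws, so only columns() has to be provided.
  @Override
  public Column[] columns() {
    return new Column[] {
      Column.create("id", DataTypes.LongType),
      Column.create("payload", DataTypes.StringType)
    };
  }

  @Override
  public Set<TableCapability> capabilities() {
    return EnumSet.of(TableCapability.BATCH_READ, TableCapability.AUTOMATIC_SCHEMA_EVOLUTION);
  }
}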
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableInfo.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableInfo.java
index 8dc71c5aee472..a5b4e333afa87 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableInfo.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableInfo.java
@@ -16,14 +16,14 @@
*/
package org.apache.spark.sql.connector.catalog;
-import static com.google.common.base.Preconditions.checkNotNull;
-import com.google.common.collect.Maps;
+import java.util.HashMap;
+import java.util.Map;
+import java.util.Objects;
+
import org.apache.spark.sql.connector.catalog.constraints.Constraint;
import org.apache.spark.sql.connector.expressions.Transform;
import org.apache.spark.sql.types.StructType;
-import java.util.Map;
-
public class TableInfo {
private final Column[] columns;
@@ -62,7 +62,7 @@ public Transform[] partitions() {
public static class Builder {
private Column[] columns;
- private Map<String, String> properties = Maps.newHashMap();
+ private Map<String, String> properties = new HashMap<>();
private Transform[] partitions = new Transform[0];
private Constraint[] constraints = new Constraint[0];
@@ -87,7 +87,7 @@ public Builder withConstraints(Constraint[] constraints) {
}
public TableInfo build() {
- checkNotNull(columns, "columns should not be null");
+ Objects.requireNonNull(columns, "columns should not be null");
return new TableInfo(this);
}
}
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableSummary.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableSummary.java
index e08f83b98319e..8f46a372342a8 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableSummary.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/TableSummary.java
@@ -17,9 +17,9 @@
package org.apache.spark.sql.connector.catalog;
-import org.apache.spark.annotation.Evolving;
+import java.util.Objects;
-import static com.google.common.base.Preconditions.checkNotNull;
+import org.apache.spark.annotation.Evolving;
@Evolving
public interface TableSummary {
@@ -38,7 +38,7 @@ static TableSummary of(Identifier identifier, String tableType) {
record TableSummaryImpl(Identifier identifier, String tableType) implements TableSummary {
TableSummaryImpl {
- checkNotNull(identifier, "Identifier of a table summary object cannot be null");
- checkNotNull(tableType, "Table type of a table summary object cannot be null");
+ Objects.requireNonNull(identifier, "Identifier of a table summary object cannot be null");
+ Objects.requireNonNull(tableType, "Table type of a table summary object cannot be null");
}
}
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/BaseConstraint.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/BaseConstraint.java
index 28791a9f3a58f..f93d716a27842 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/BaseConstraint.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/BaseConstraint.java
@@ -63,15 +63,26 @@ public boolean rely() {
@Override
public String toDDL() {
+ // The validation status is not included in the DDL output as it's not part of
+ // the Spark SQL syntax for constraints.
return String.format(
- "CONSTRAINT %s %s %s %s %s",
+ "CONSTRAINT %s %s %s %s",
name,
definition(),
enforced ? "ENFORCED" : "NOT ENFORCED",
- validationStatus,
rely ? "RELY" : "NORELY");
}
+ public String toDescription() {
+ StringJoiner joiner = new StringJoiner(" ");
+ joiner.add(definition());
+ joiner.add(enforced ? "ENFORCED" : "NOT ENFORCED");
+ if (rely) {
+ joiner.add("RELY");
+ }
+ return joiner.toString();
+ }
+
@Override
public String toString() {
return toDDL();
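The two formats now differ as follows: toDDL() no longer prints the validation status, and toDescription() additionally drops the constraint name (DESCRIBE TABLE prints it separately) and the NORELY default. A hedged sketch that replays the formatting logic above on hypothetical sample values (not the real constraint builder API):

import java.util.StringJoiner;

public class ConstraintFormatDemo {
  public static void main(String[] args) {
    String name = "positive_id";
    String definition = "CHECK (id > 0)";  // illustrative definition() output
    boolean enforced = true;
    boolean rely = false;

    // toDDL(): four fields, validation status removed
    String ddl = String.format("CONSTRAINT %s %s %s %s",
        name, definition, enforced ? "ENFORCED" : "NOT ENFORCED", rely ? "RELY" : "NORELY");
    System.out.println(ddl);  // CONSTRAINT positive_id CHECK (id > 0) ENFORCED NORELY

    // toDescription(): no name, RELY only when set
    StringJoiner joiner = new StringJoiner(" ");
    joiner.add(definition);
    joiner.add(enforced ? "ENFORCED" : "NOT ENFORCED");
    if (rely) {
      joiner.add("RELY");
    }
    System.out.println(joiner.toString());  // CHECK (id > 0) ENFORCED
  }
}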
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/Constraint.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/Constraint.java
index c3a2cd73e9abe..93ffb22422e60 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/Constraint.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/catalog/constraints/Constraint.java
@@ -58,6 +58,12 @@ public interface Constraint {
*/
String toDDL();
+ /**
+ * Returns the constraint description for DESCRIBE TABLE output, excluding the constraint
+ * name (shown separately).
+ */
+ String toDescription();
+
/**
* Instantiates a builder for a CHECK constraint.
*
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/expressions/filter/Predicate.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/expressions/filter/Predicate.java
index e58cddc274c5f..65f2bd88940a3 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/expressions/filter/Predicate.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/expressions/filter/Predicate.java
@@ -136,6 +136,12 @@
*    <li>Since version: 3.3.0</li>
*   </ul>
*  </li>
+ *  <li>Name: <code>BOOLEAN_EXPRESSION</code>
+ *   <ul>
+ *    <li>A simple wrapper for any expression that returns boolean type.</li>
+ *    <li>Since version: 4.1.0</li>
+ *   </ul>
+ *  </li>
* </ol>
*
* @since 3.3.0
@@ -145,5 +151,8 @@ public class Predicate extends GeneralScalarExpression {
public Predicate(String name, Expression[] children) {
super(name, children);
+ if ("BOOLEAN_EXPRESSION".equals(name)) {
+ assert children.length == 1;
+ }
}
}
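
As a usage sketch (assuming only the public `Expressions.column` factory and the `Predicate` constructor shown above), a boolean-valued column can be wrapped as the new predicate like this; `V2ExpressionSQLBuilder`, changed later in this diff, simply emits the SQL of that single child:

```scala
import org.apache.spark.sql.connector.expressions.{Expression, Expressions}
import org.apache.spark.sql.connector.expressions.filter.Predicate

object BooleanExpressionSketch {
  // The constructor assertion above requires exactly one child for BOOLEAN_EXPRESSION.
  def wrap(columnName: String): Predicate = {
    val child: Expression = Expressions.column(columnName)
    new Predicate("BOOLEAN_EXPRESSION", Array(child))
  }
}
```
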
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetriesExceeded.scala b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/join/JoinType.java
similarity index 76%
rename from sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetriesExceeded.scala
rename to sql/catalyst/src/main/java/org/apache/spark/sql/connector/join/JoinType.java
index 77e1c0deab24f..56fb0a51c243a 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetriesExceeded.scala
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/join/JoinType.java
@@ -15,11 +15,18 @@
* limitations under the License.
*/
-package org.apache.spark.sql.connect.client
+package org.apache.spark.sql.connector.join;
+
+import org.apache.spark.annotation.Evolving;
/**
- * Represents an exception which was considered retriable but has exceeded retry limits.
+ * Enum representing the join type in public API.
*
- * The actual exceptions incurred can be retrieved with getSuppressed()
+ * @since 4.1.0
*/
-class RetriesExceeded extends Throwable
+@Evolving
+public enum JoinType {
+ INNER_JOIN,
+ LEFT_OUTER_JOIN,
+ RIGHT_OUTER_JOIN,
+}
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/read/SupportsPushDownJoin.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/read/SupportsPushDownJoin.java
new file mode 100644
index 0000000000000..a48a78671922a
--- /dev/null
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/read/SupportsPushDownJoin.java
@@ -0,0 +1,78 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.connector.read;
+
+import org.apache.spark.annotation.Evolving;
+import org.apache.spark.sql.connector.expressions.filter.Predicate;
+import org.apache.spark.sql.connector.join.JoinType;
+
+/**
+ * A mix-in interface for {@link ScanBuilder}. Data sources can implement this interface to
+ * push down join operators.
+ *
+ * @since 4.1.0
+ */
+@Evolving
+public interface SupportsPushDownJoin extends ScanBuilder {
+ /**
+ * Returns true if the other side of the join is compatible with the
+ * current {@code SupportsPushDownJoin} for a join push down, meaning both sides can be
+ * processed together within the same underlying data source.
+   *
+   * <p>
+ * For example, JDBC connectors are compatible if they use the same
+ * host, port, username, and password.
+ */
+ boolean isOtherSideCompatibleForJoin(SupportsPushDownJoin other);
+
+ /**
+   * Pushes down the join between the current {@code SupportsPushDownJoin} and the other
+   * side's {@code SupportsPushDownJoin}.
+ *
+ * @param other {@code SupportsPushDownJoin} that this {@code SupportsPushDownJoin}
+ * gets joined with.
+ * @param joinType the type of join.
+ * @param leftSideRequiredColumnsWithAliases required output of the
+ * left side {@code SupportsPushDownJoin}
+ * @param rightSideRequiredColumnsWithAliases required output of the
+ * right side {@code SupportsPushDownJoin}
+   * @param condition join condition. Columns are named after the specified aliases in
+   *    {@code leftSideRequiredColumnsWithAliases} and {@code rightSideRequiredColumnsWithAliases}
+   * @return true if the join has been successfully pushed down.
+ */
+ boolean pushDownJoin(
+ SupportsPushDownJoin other,
+ JoinType joinType,
+ ColumnWithAlias[] leftSideRequiredColumnsWithAliases,
+ ColumnWithAlias[] rightSideRequiredColumnsWithAliases,
+ Predicate condition
+ );
+
+ /**
+ * A helper class used when there are duplicated names coming from 2 sides of the join
+   * A helper class used when duplicate column names come from the two sides of the join
+   * operator.
+   *
+   * Holds the original output column name and the alias of the new output column.
+ record ColumnWithAlias(String colName, String alias) {
+ public String prettyString() {
+ if (alias == null) return colName;
+ else return colName + " AS " + alias;
+ }
+ }
+}
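
A minimal, hypothetical Scala skeleton of a JDBC-style implementation of the new interface; the `connectionKey` field and the way the pushed-down query text is assembled are illustrative assumptions, not part of this patch:

```scala
import org.apache.spark.sql.connector.expressions.filter.Predicate
import org.apache.spark.sql.connector.join.JoinType
import org.apache.spark.sql.connector.read.{Scan, SupportsPushDownJoin}
import org.apache.spark.sql.connector.read.SupportsPushDownJoin.ColumnWithAlias

class ExampleJoinPushDownScanBuilder(
    val connectionKey: String,        // e.g. host/port/user, assumed for this sketch
    private var selectQuery: String) extends SupportsPushDownJoin {

  // Both sides are only joinable inside the source if they talk to the same database.
  override def isOtherSideCompatibleForJoin(other: SupportsPushDownJoin): Boolean =
    other match {
      case o: ExampleJoinPushDownScanBuilder => o.connectionKey == connectionKey
      case _ => false
    }

  override def pushDownJoin(
      other: SupportsPushDownJoin,
      joinType: JoinType,
      leftSideRequiredColumnsWithAliases: Array[ColumnWithAlias],
      rightSideRequiredColumnsWithAliases: Array[ColumnWithAlias],
      condition: Predicate): Boolean = {
    // The aliases disambiguate duplicate column names coming from the two sides.
    val projection =
      (leftSideRequiredColumnsWithAliases ++ rightSideRequiredColumnsWithAliases)
        .map(_.prettyString())
        .mkString(", ")
    selectQuery = s"SELECT $projection FROM (...) JOIN (...) ON $condition"
    true
  }

  override def build(): Scan = {
    // Out of scope for this sketch: build a Scan that executes `selectQuery`.
    throw new UnsupportedOperationException("sketch only")
  }
}
```
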
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/util/V2ExpressionSQLBuilder.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/util/V2ExpressionSQLBuilder.java
index 4298f31227500..2bc994acaf33f 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/util/V2ExpressionSQLBuilder.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/util/V2ExpressionSQLBuilder.java
@@ -99,6 +99,8 @@ public String build(Expression expr) {
case "CONTAINS" -> visitContains(build(e.children()[0]), build(e.children()[1]));
case "=", "<>", "<=>", "<", "<=", ">", ">=" ->
visitBinaryComparison(name, e.children()[0], e.children()[1]);
+ case "BOOLEAN_EXPRESSION" ->
+ build(expr.children()[0]);
case "+", "*", "/", "%", "&", "|", "^" ->
visitBinaryArithmetic(name, inputToSQL(e.children()[0]), inputToSQL(e.children()[1]));
case "-" -> {
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/write/BatchWrite.java b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/write/BatchWrite.java
index 8c068928415f4..c8febd0fe4934 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/connector/write/BatchWrite.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/connector/write/BatchWrite.java
@@ -19,6 +19,8 @@
import org.apache.spark.annotation.Evolving;
+import java.util.Map;
+
/**
* An interface that defines how to write the data to data source for batch processing.
*
@@ -88,6 +90,49 @@ default void onDataWriterCommit(WriterCommitMessage message) {}
*/
void commit(WriterCommitMessage[] messages);
+ /**
+ * Commits this writing job with a list of commit messages and operation metrics.
+ *
+   * If this method fails (by throwing an exception), this writing job is considered to have
+   * failed, and {@link #abort(WriterCommitMessage[])} would be called. The state of the
+   * destination is undefined and {@link #abort(WriterCommitMessage[])} may not be able to deal
+   * with it.
+ *
+ * Note that speculative execution may cause multiple tasks to run for a partition. By default,
+ * Spark uses the commit coordinator to allow at most one task to commit. Implementations can
+ * disable this behavior by overriding {@link #useCommitCoordinator()}. If disabled, multiple
+ * tasks may have committed successfully and one successful commit message per task will be
+ * passed to this commit method. The remaining commit messages are ignored by Spark.
+ *
+ * @param messages a list of commit messages from successful data writers, produced by
+ * {@link DataWriter#commit()}.
+   * @param metrics a map of operation metrics collected from the query producing the write.
+   *                The keys will be prefixed by the operation type, e.g. `merge`.
+ *
+ * Currently supported metrics are:
+   *                <ul>
+   *                  <li>Operation Type = `merge`
+   *                    <ul>
+   *                      <li>`numTargetRowsCopied`: number of target rows copied unmodified because
+   *                      they did not match any action</li>
+   *                      <li>`numTargetRowsDeleted`: number of target rows deleted</li>
+   *                      <li>`numTargetRowsUpdated`: number of target rows updated</li>
+   *                      <li>`numTargetRowsInserted`: number of target rows inserted</li>
+   *                      <li>`numTargetRowsMatchedUpdated`: number of target rows updated by a
+   *                      matched clause</li>
+   *                      <li>`numTargetRowsMatchedDeleted`: number of target rows deleted by a
+   *                      matched clause</li>
+   *                      <li>`numTargetRowsNotMatchedBySourceUpdated`: number of target rows
+   *                      updated by a not matched by source clause</li>
+   *                      <li>`numTargetRowsNotMatchedBySourceDeleted`: number of target rows
+   *                      deleted by a not matched by source clause</li>
+   *                    </ul>
+   *                  </li>
+   *                </ul>
+ */
+  default void commit(WriterCommitMessage[] messages, Map<String, Long> metrics) {
+ commit(messages);
+ }
+
/**
* Aborts this writing job because some data writers are failed and keep failing when retry,
* or the Spark job fails with some unknown reasons,
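
A minimal sketch of a sink adopting the new overload, assuming the metrics map carries `Long` counters keyed as described above (the exact key format is decided by the caller); it prints the metrics and then delegates to the metric-less commit:

```scala
import java.util.{Map => JMap}

import org.apache.spark.sql.connector.write.{
  BatchWrite, DataWriterFactory, PhysicalWriteInfo, WriterCommitMessage}

class ExampleBatchWrite extends BatchWrite {

  override def createBatchWriterFactory(info: PhysicalWriteInfo): DataWriterFactory =
    throw new UnsupportedOperationException("sketch only")

  override def commit(messages: Array[WriterCommitMessage]): Unit = {
    // Placeholder: atomically publish whatever the data writers produced.
  }

  // New overload: inspect the operation metrics, then fall back to the classic commit.
  override def commit(messages: Array[WriterCommitMessage],
      metrics: JMap[String, java.lang.Long]): Unit = {
    metrics.forEach((name, value) => println(s"write metric $name = $value")) // a real sink would log
    commit(messages)
  }

  override def abort(messages: Array[WriterCommitMessage]): Unit = ()
}
```

Because the new method is a `default` that delegates to the old one, existing sinks keep working unchanged and only metrics-aware sinks need to override it.
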
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/util/CaseInsensitiveStringMap.java b/sql/catalyst/src/main/java/org/apache/spark/sql/util/CaseInsensitiveStringMap.java
index ec461f9740019..0c85f9b41cbaf 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/util/CaseInsensitiveStringMap.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/util/CaseInsensitiveStringMap.java
@@ -63,7 +63,7 @@ public CaseInsensitiveStringMap(Map<String, String> originalMap) {
String key = toLowerCase(entry.getKey());
if (delegate.containsKey(key)) {
logger.warn("Converting duplicated key {} into CaseInsensitiveStringMap.",
- MDC.of(LogKeys.KEY$.MODULE$, entry.getKey()));
+ MDC.of(LogKeys.KEY, entry.getKey()));
}
delegate.put(key, entry.getValue());
}
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ArrowColumnVector.java b/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ArrowColumnVector.java
index 7382d96e20baa..66116d7c952fd 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ArrowColumnVector.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ArrowColumnVector.java
@@ -182,6 +182,8 @@ void initAccessor(ValueVector vector) {
accessor = new TimestampAccessor(timeStampMicroTZVector);
} else if (vector instanceof TimeStampMicroVector timeStampMicroVector) {
accessor = new TimestampNTZAccessor(timeStampMicroVector);
+ } else if (vector instanceof TimeNanoVector timeNanoVector) {
+ accessor = new TimeNanoAccessor(timeNanoVector);
} else if (vector instanceof MapVector mapVector) {
accessor = new MapAccessor(mapVector);
} else if (vector instanceof ListVector listVector) {
@@ -522,6 +524,21 @@ final long getLong(int rowId) {
}
}
+ static class TimeNanoAccessor extends ArrowVectorAccessor {
+
+ private final TimeNanoVector accessor;
+
+ TimeNanoAccessor(TimeNanoVector vector) {
+ super(vector);
+ this.accessor = vector;
+ }
+
+ @Override
+ final long getLong(int rowId) {
+ return accessor.get(rowId);
+ }
+ }
+
static class ArrayAccessor extends ArrowVectorAccessor {
private final ListVector accessor;
diff --git a/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ColumnVector.java b/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ColumnVector.java
index 54b62c00283fa..f1d1f5b3ea800 100644
--- a/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ColumnVector.java
+++ b/sql/catalyst/src/main/java/org/apache/spark/sql/vectorized/ColumnVector.java
@@ -16,6 +16,8 @@
*/
package org.apache.spark.sql.vectorized;
+import scala.PartialFunction;
+
import org.apache.spark.annotation.Evolving;
import org.apache.spark.sql.types.DataType;
import org.apache.spark.sql.types.Decimal;
@@ -336,10 +338,21 @@ public final VariantVal getVariant(int rowId) {
* Sets up the data type of this column vector.
*/
protected ColumnVector(DataType type) {
- if (type instanceof UserDefinedType) {
- this.type = ((UserDefinedType) type).sqlType();
- } else {
- this.type = type;
- }
+ this.type = type.transformRecursively(
+      new PartialFunction<DataType, DataType>() {
+ @Override
+ public boolean isDefinedAt(DataType x) {
+          return x instanceof UserDefinedType<?>;
+ }
+
+ @Override
+ public DataType apply(DataType t) {
+          if (t instanceof UserDefinedType<?> udt) {
+ return udt.sqlType();
+ } else {
+ return t;
+ }
+ }
+ });
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CapturesConfig.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CapturesConfig.scala
new file mode 100644
index 0000000000000..c77c3ac537e14
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CapturesConfig.scala
@@ -0,0 +1,100 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst
+
+import scala.collection.mutable
+
+import org.apache.spark.sql.internal.SQLConf
+
+/**
+ * Trait used for persisting the conf values in views/UDFs.
+ */
+trait CapturesConfig {
+ private val configPrefixDenyList = Seq(
+ SQLConf.MAX_NESTED_VIEW_DEPTH.key,
+ "spark.sql.optimizer.",
+ "spark.sql.codegen.",
+ "spark.sql.execution.",
+ "spark.sql.shuffle.",
+ "spark.sql.adaptive.",
+ // ignore optimization configs used in `RelationConversions`
+ "spark.sql.hive.convertMetastoreParquet",
+ "spark.sql.hive.convertMetastoreOrc",
+ "spark.sql.hive.convertInsertingPartitionedTable",
+ "spark.sql.hive.convertInsertingUnpartitionedTable",
+ "spark.sql.hive.convertMetastoreCtas",
+ SQLConf.ADDITIONAL_REMOTE_REPOSITORIES.key)
+
+ private val configAllowList = Set(
+ SQLConf.DISABLE_HINTS.key
+ )
+
+ /**
+ * Set of single-pass resolver confs that shouldn't be stored during view/UDF/proc creation.
+ * This is needed to avoid accidental failures in tentative and dual-run modes when querying the
+ * view.
+ */
+ private val singlePassResolverDenyList = Set(
+ SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_ENABLED_TENTATIVELY.key,
+ SQLConf.ANALYZER_DUAL_RUN_LEGACY_AND_SINGLE_PASS_RESOLVER.key
+ )
+
+ /**
+   * Convert the provided SQL configs to `properties`. Here we only capture the SQL configs that
+   * are modifiable and should be captured, i.e. either present in the allow list or not matching
+   * any deny list entry. We also always capture `SESSION_LOCAL_TIMEZONE`, whose default value
+   * relies on the JVM system timezone, and `ANSI_ENABLED`.
+ *
+ * We need to always capture them to make sure we apply the same configs when querying the
+ * view/UDF.
+ */
+ def sqlConfigsToProps(conf: SQLConf, prefix: String): Map[String, String] = {
+ val modifiedConfs = getModifiedConf(conf)
+
+ val alwaysCaptured = Seq(SQLConf.SESSION_LOCAL_TIMEZONE, SQLConf.ANSI_ENABLED)
+ .filter(c => !modifiedConfs.contains(c.key))
+ .map(c => (c.key, conf.getConf(c).toString))
+
+ val props = new mutable.HashMap[String, String]
+ for ((key, value) <- modifiedConfs ++ alwaysCaptured) {
+ props.put(s"$prefix$key", value)
+ }
+ props.toMap
+ }
+
+ /**
+ * Get all configurations that are modifiable and should be captured.
+ */
+ private def getModifiedConf(conf: SQLConf): Map[String, String] = {
+ conf.getAllConfs.filter { case (k, _) =>
+ conf.isModifiable(k) && shouldCaptureConfig(k)
+ }
+ }
+
+ /**
+   * Capture a view config if either:
+   * 1. it exists in the allow list, or
+   * 2. it does not exist in any of the deny lists.
+ */
+ private def shouldCaptureConfig(key: String): Boolean = {
+ configAllowList.contains(key) || (
+ !configPrefixDenyList.exists(prefix => key.startsWith(prefix)) &&
+ !singlePassResolverDenyList.contains(key)
+ )
+ }
+}
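
A small usage sketch of the new trait; the `example.sqlConfig.` prefix is invented for illustration, since the real prefixes used for views and UDFs are defined by their respective callers:

```scala
import org.apache.spark.sql.catalyst.CapturesConfig
import org.apache.spark.sql.internal.SQLConf

object ExampleConfCapture extends CapturesConfig {
  // Snapshot the current session's capturable SQL configs under an illustrative prefix.
  // SESSION_LOCAL_TIMEZONE and ANSI_ENABLED are always included, per the trait's contract.
  def capture(): Map[String, String] =
    sqlConfigsToProps(SQLConf.get, prefix = "example.sqlConfig.")
}
```
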
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CatalystTypeConverters.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CatalystTypeConverters.scala
index bb6afb3b13faf..c1e0674d391d2 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CatalystTypeConverters.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/CatalystTypeConverters.scala
@@ -375,14 +375,14 @@ object CatalystTypeConverters {
private object TimeConverter extends CatalystTypeConverter[LocalTime, LocalTime, Any] {
override def toCatalystImpl(scalaValue: LocalTime): Long = {
- DateTimeUtils.localTimeToMicros(scalaValue)
+ DateTimeUtils.localTimeToNanos(scalaValue)
}
override def toScala(catalystValue: Any): LocalTime = {
if (catalystValue == null) null
- else DateTimeUtils.microsToLocalTime(catalystValue.asInstanceOf[Long])
+ else DateTimeUtils.nanosToLocalTime(catalystValue.asInstanceOf[Long])
}
override def toScalaImpl(row: InternalRow, column: Int): LocalTime =
- DateTimeUtils.microsToLocalTime(row.getLong(column))
+ DateTimeUtils.nanosToLocalTime(row.getLong(column))
}
private object TimestampConverter extends CatalystTypeConverter[Any, Timestamp, Any] {
@@ -579,6 +579,7 @@ object CatalystTypeConverters {
new DecimalConverter(DecimalType(Math.max(d.precision, d.scale), d.scale)).toCatalyst(d)
case d: JavaBigDecimal =>
new DecimalConverter(DecimalType(Math.max(d.precision, d.scale), d.scale)).toCatalyst(d)
+ case seq: scala.collection.mutable.ArraySeq[_] => convertToCatalyst(seq.array)
case seq: Seq[Any] => new GenericArrayData(seq.map(convertToCatalyst).toArray)
case r: Row => InternalRow(r.toSeq.map(convertToCatalyst): _*)
case arr: Array[Byte] => arr
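
The move from microseconds to nanoseconds matters for sub-microsecond TIME values; a minimal round-trip sketch using only the `DateTimeUtils` helpers referenced above:

```scala
import java.time.LocalTime

import org.apache.spark.sql.catalyst.util.DateTimeUtils

object TimeNanosRoundTrip {
  def main(args: Array[String]): Unit = {
    // 123,456,789 ns within the second survives the nanos encoding, whereas the previous
    // micros encoding would have dropped the trailing 789 ns.
    val t = LocalTime.of(23, 59, 59, 123456789)
    val nanos: Long = DateTimeUtils.localTimeToNanos(t)
    assert(DateTimeUtils.nanosToLocalTime(nanos) == t)
  }
}
```
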
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/DeserializerBuildHelper.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/DeserializerBuildHelper.scala
index 9b22f28ed12da..15de70e35a45d 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/DeserializerBuildHelper.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/DeserializerBuildHelper.scala
@@ -160,7 +160,7 @@ object DeserializerBuildHelper {
StaticInvoke(
DateTimeUtils.getClass,
ObjectType(classOf[java.time.LocalTime]),
- "microsToLocalTime",
+ "nanosToLocalTime",
path :: Nil,
returnNullable = false)
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/InternalRow.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/InternalRow.scala
index 5158cdb276fd4..f9bf0ebdfd9ad 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/InternalRow.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/InternalRow.scala
@@ -175,7 +175,7 @@ object InternalRow {
case ShortType => (input, v) => input.setShort(ordinal, v.asInstanceOf[Short])
case IntegerType | DateType | _: YearMonthIntervalType =>
(input, v) => input.setInt(ordinal, v.asInstanceOf[Int])
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType =>
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
(input, v) => input.setLong(ordinal, v.asInstanceOf[Long])
case FloatType => (input, v) => input.setFloat(ordinal, v.asInstanceOf[Float])
case DoubleType => (input, v) => input.setDouble(ordinal, v.asInstanceOf[Double])
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/SerializerBuildHelper.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/SerializerBuildHelper.scala
index c8bf1f5237997..82b3cdc508bf9 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/SerializerBuildHelper.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/SerializerBuildHelper.scala
@@ -103,7 +103,7 @@ object SerializerBuildHelper {
StaticInvoke(
DateTimeUtils.getClass,
TimeType(),
- "localTimeToMicros",
+ "localTimeToNanos",
inputObject :: Nil,
returnNullable = false)
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala
index f30c22c2566ba..1896a1c7ac279 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/Analyzer.scala
@@ -18,7 +18,7 @@
package org.apache.spark.sql.catalyst.analysis
import java.util
-import java.util.Locale
+import java.util.{LinkedHashMap, Locale}
import scala.collection.mutable
import scala.collection.mutable.ArrayBuffer
@@ -31,9 +31,7 @@ import org.apache.spark.sql.catalyst._
import org.apache.spark.sql.catalyst.analysis.resolver.{
AnalyzerBridgeState,
HybridAnalyzer,
- Resolver => OperatorResolver,
- ResolverExtension,
- ResolverGuard
+ ResolverExtension
}
import org.apache.spark.sql.catalyst.catalog._
import org.apache.spark.sql.catalyst.encoders.OuterScopes
@@ -258,7 +256,10 @@ object Analyzer {
"spark.sql.expressionTreeChangeLog.level"
)
- def retainResolutionConfigsForAnalysis(newConf: SQLConf, existingConf: SQLConf): Unit = {
+ def retainResolutionConfigsForAnalysis(
+ newConf: SQLConf,
+ existingConf: SQLConf,
+ createSparkVersion: String = ""): Unit = {
val retainedConfigs = existingConf.getAllConfs.filter { case (key, _) =>
// Also apply catalog configs
RETAINED_ANALYSIS_FLAGS.contains(key) || key.startsWith("spark.sql.catalog.")
@@ -267,6 +268,25 @@ object Analyzer {
retainedConfigs.foreach { case (k, v) =>
newConf.settings.put(k, v)
}
+
+ trySetAnsiValue(newConf, createSparkVersion)
+ }
+
+ /**
+   * If the ANSI value wasn't persisted for a view or a UDF, we set it to `true` when the Spark
+   * version used to create the view is 4.0.0 or higher, and to `false` when that version is
+   * lower than 4.0.0 or wasn't stored at all (in which case we assume the value is `false`).
+ */
+ def trySetAnsiValue(sqlConf: SQLConf, createSparkVersion: String = ""): Unit = {
+ if (conf.getConf(SQLConf.ASSUME_ANSI_FALSE_IF_NOT_PERSISTED) &&
+ !sqlConf.settings.containsKey(SQLConf.ANSI_ENABLED.key)) {
+ if (createSparkVersion.startsWith("4.")) {
+ sqlConf.settings.put(SQLConf.ANSI_ENABLED.key, "true")
+ } else {
+ sqlConf.settings.put(SQLConf.ANSI_ENABLED.key, "false")
+ }
+ }
}
}
@@ -297,17 +317,17 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
def getRelationResolution: RelationResolution = relationResolution
def executeAndCheck(plan: LogicalPlan, tracker: QueryPlanningTracker): LogicalPlan = {
- if (plan.analyzed) return plan
- AnalysisHelper.markInAnalyzer {
- new HybridAnalyzer(
- this,
- new ResolverGuard(catalogManager),
- new OperatorResolver(
- catalogManager,
- singlePassResolverExtensions,
- singlePassMetadataResolverExtensions
- )
- ).apply(plan, tracker)
+ if (plan.analyzed) {
+ plan
+ } else {
+ AnalysisContext.reset()
+ try {
+ AnalysisHelper.markInAnalyzer {
+ HybridAnalyzer.fromLegacyAnalyzer(legacyAnalyzer = this).apply(plan, tracker)
+ }
+ } finally {
+ AnalysisContext.reset()
+ }
}
}
@@ -424,6 +444,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
AddMetadataColumns ::
DeduplicateRelations ::
ResolveCollationName ::
+ ResolveMergeIntoSchemaEvolution ::
new ResolveReferences(catalogManager) ::
// Please do not insert any other rules in between. See the TODO comments in rule
// ResolveLateralColumnAliasReference for more details.
@@ -454,7 +475,6 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
ResolveNaturalAndUsingJoin ::
ResolveOutputRelation ::
new ResolveTableConstraints(catalogManager) ::
- new ResolveDataFrameDropColumns(catalogManager) ::
new ResolveSetVariable(catalogManager) ::
ExtractWindowExpressions ::
GlobalAggregates ::
@@ -519,7 +539,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
* 1. if both side are interval, stays the same;
* 2. else if one side is date and the other is interval,
* turns it to [[DateAddInterval]];
- * 3. else if one side is interval, turns it to [[TimeAdd]];
+ * 3. else if one side is interval, turns it to [[TimestampAddInterval]];
* 4. else if one side is date, turns it to [[DateAdd]] ;
* 5. else stays the same.
*
@@ -527,7 +547,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
* 1. if both side are interval, stays the same;
* 2. else if the left side is date and the right side is interval,
* turns it to [[DateAddInterval(l, -r)]];
- * 3. else if the right side is an interval, turns it to [[TimeAdd(l, -r)]];
+ * 3. else if the right side is an interval, turns it to [[TimestampAddInterval(l, -r)]];
* 4. else if one side is timestamp, turns it to [[SubtractTimestamps]];
* 5. else if the right side is date, turns it to [[DateDiff]]/[[SubtractDates]];
* 6. else if the left side is date, turns it to [[DateSub]];
@@ -795,6 +815,10 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
} else {
colResolved.havingCondition
}
+ // `cond` might contain unresolved aggregate functions so defer its resolution to
+ // `ResolveAggregateFunctions` rule if needed.
+ if (!cond.resolved) return colResolved
+
// Try resolving the condition of the filter as though it is in the aggregate clause
val (extraAggExprs, Seq(resolvedHavingCond)) =
ResolveAggregateFunctions.resolveExprsWithAggregate(Seq(cond), aggForResolving)
@@ -1483,6 +1507,8 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
new ResolveReferencesInUpdate(catalogManager)
private val resolveReferencesInSort =
new ResolveReferencesInSort(catalogManager)
+ private val resolveDataFrameDropColumns =
+ new ResolveDataFrameDropColumns(catalogManager)
/**
* Return true if there're conflicting attributes among children's outputs of a plan
@@ -1572,29 +1598,11 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
)
case u @ Union(children, _, _)
- // if there are duplicate output columns, give them unique expr ids
- if children.exists(c => c.output.map(_.exprId).distinct.length < c.output.length) =>
- val newChildren = children.map { c =>
- if (c.output.map(_.exprId).distinct.length < c.output.length) {
- val existingExprIds = mutable.HashSet[ExprId]()
- val projectList = c.output.map { attr =>
- if (existingExprIds.contains(attr.exprId)) {
- // replace non-first duplicates with aliases and tag them
- val newMetadata = new MetadataBuilder().withMetadata(attr.metadata)
- .putNull("__is_duplicate").build()
- Alias(attr, attr.name)(explicitMetadata = Some(newMetadata))
- } else {
- // leave first duplicate alone
- existingExprIds.add(attr.exprId)
- attr
- }
- }
- Project(projectList, c)
- } else {
- c
- }
- }
- u.withNewChildren(newChildren)
+ // if there are duplicate output columns, give them unique expr ids
+ if (u.allChildrenCompatible &&
+ conf.getConf(SQLConf.ENFORCE_TYPE_COERCION_BEFORE_UNION_DEDUPLICATION)) &&
+ children.exists(c => c.output.map(_.exprId).distinct.length < c.output.length) =>
+ DeduplicateUnionChildOutput.deduplicateOutputPerChild(u)
// A special case for Generate, because the output of Generate should not be resolved by
// ResolveReferences. Attributes in the output will be resolved by ResolveGenerate.
@@ -1662,7 +1670,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
case u: UpdateTable => resolveReferencesInUpdate(u)
case m @ MergeIntoTable(targetTable, sourceTable, _, _, _, _, _)
- if !m.resolved && targetTable.resolved && sourceTable.resolved =>
+ if !m.resolved && targetTable.resolved && sourceTable.resolved && !m.needSchemaEvolution =>
EliminateSubqueryAliases(targetTable) match {
case r: NamedRelation if r.skipSchemaResolution =>
@@ -1685,9 +1693,12 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
// The update value can access columns from both target and source tables.
resolveAssignments(assignments, m, MergeResolvePolicy.BOTH))
case UpdateStarAction(updateCondition) =>
- val assignments = targetTable.output.map { attr =>
- Assignment(attr, UnresolvedAttribute(Seq(attr.name)))
- }
+ // Use only source columns. Missing columns in target will be handled in
+ // ResolveRowLevelCommandAssignments.
+ val assignments = targetTable.output.flatMap{ targetAttr =>
+ sourceTable.output.find(
+ sourceCol => conf.resolver(sourceCol.name, targetAttr.name))
+ .map(Assignment(targetAttr, _))}
UpdateAction(
updateCondition.map(resolveExpressionByPlanChildren(_, m)),
// For UPDATE *, the value must be from source table.
@@ -1708,9 +1719,12 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
// access columns from the source table.
val resolvedInsertCondition = insertCondition.map(
resolveExpressionByPlanOutput(_, m.sourceTable))
- val assignments = targetTable.output.map { attr =>
- Assignment(attr, UnresolvedAttribute(Seq(attr.name)))
- }
+ // Use only source columns. Missing columns in target will be handled in
+ // ResolveRowLevelCommandAssignments.
+ val assignments = targetTable.output.flatMap{ targetAttr =>
+ sourceTable.output.find(
+ sourceCol => conf.resolver(sourceCol.name, targetAttr.name))
+ .map(Assignment(targetAttr, _))}
InsertAction(
resolvedInsertCondition,
resolveAssignments(assignments, m, MergeResolvePolicy.SOURCE))
@@ -1791,6 +1805,9 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
// Pass for Execute Immediate as arguments will be resolved by [[SubstituteExecuteImmediate]].
case e : ExecuteImmediateQuery => e
+ case d: DataFrameDropColumns if !d.resolved =>
+ resolveDataFrameDropColumns(d)
+
case q: LogicalPlan =>
logTrace(s"Attempting to resolve ${q.simpleString(conf.maxToStringFields)}")
q.mapExpressions(resolveExpressionByPlanChildren(_, q, includeLastResort = true))
@@ -2241,12 +2258,15 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
case _ => tvf
}
- Project(
- Seq(UnresolvedStar(Some(Seq(alias)))),
- LateralJoin(
- tableArgs.map(_._2).reduceLeft(Join(_, _, Inner, None, JoinHint.NONE)),
- LateralSubquery(SubqueryAlias(alias, tvfWithTableColumnIndexes)), Inner, None)
- )
+ val lateralJoin = LateralJoin(
+ tableArgs.map(_._2).reduceLeft(Join(_, _, Inner, None, JoinHint.NONE)),
+ LateralSubquery(SubqueryAlias(alias, tvfWithTableColumnIndexes)), Inner, None)
+
+      // Set the tag so that it can be used to differentiate a lateral join added by a
+      // TABLE argument from one added by the user.
+ lateralJoin.setTagValue(LateralJoin.BY_TABLE_ARGUMENT, ())
+
+ Project(Seq(UnresolvedStar(Some(Seq(alias)))), lateralJoin)
}
case q: LogicalPlan =>
@@ -2301,7 +2321,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
}
PythonUDTF(
u.name, u.func, analyzeResult.schema, Some(analyzeResult.pickledAnalyzeResult),
- newChildren, u.evalType, u.udfDeterministic, u.resultId)
+ newChildren, u.evalType, u.udfDeterministic, u.resultId, None, u.tableArguments)
}
}
}
@@ -2557,9 +2577,10 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
// Extract the function input project list from the SQL function plan and
// inline the SQL function expression.
plan match {
- case Project(body :: Nil, Project(aliases, _: LocalRelation)) =>
- projectList ++= aliases
- SQLScalarFunction(f.function, aliases.map(_.toAttribute), body)
+ case Project(body :: Nil, Project(aliases, _: OneRowRelation)) =>
+ val inputs = aliases.map(stripOuterReference)
+ projectList ++= inputs
+ SQLScalarFunction(f.function, inputs.map(_.toAttribute), body)
case o =>
throw new AnalysisException(
errorClass = "INVALID_SQL_FUNCTION_PLAN_STRUCTURE",
@@ -2935,7 +2956,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
def resolveExprsWithAggregate(
exprs: Seq[Expression],
agg: Aggregate): (Seq[NamedExpression], Seq[Expression]) = {
- val extraAggExprs = ArrayBuffer.empty[NamedExpression]
+ val extraAggExprs = new LinkedHashMap[Expression, NamedExpression]
val transformed = exprs.map { e =>
if (!e.resolved) {
e
@@ -2943,39 +2964,44 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
buildAggExprList(e, agg, extraAggExprs)
}
}
- (extraAggExprs.toSeq, transformed)
+ (extraAggExprs.values().asScala.toSeq, transformed)
}
private def buildAggExprList(
expr: Expression,
agg: Aggregate,
- aggExprList: ArrayBuffer[NamedExpression]): Expression = {
+ aggExprMap: LinkedHashMap[Expression, NamedExpression]): Expression = {
// Avoid adding an extra aggregate expression if it's already present in
- // `agg.aggregateExpressions`.
- val index = agg.aggregateExpressions.indexWhere {
- case Alias(child, _) => child semanticEquals expr
- case other => other semanticEquals expr
- }
- if (index >= 0) {
- agg.aggregateExpressions(index).toAttribute
+ // `agg.aggregateExpressions`. Trim inner aliases from aggregate expressions because of
+ // expressions like `spark_grouping_id` that can have inner aliases.
+ val replacement: Option[NamedExpression] =
+ agg.aggregateExpressions.foldLeft(Option.empty[NamedExpression]) {
+ case (None, alias: Alias) if expr.semanticEquals(trimAliases(alias.child)) => Some(alias)
+ case (None | Some(_: Alias), aggExpr) if expr.semanticEquals(aggExpr) => Some(aggExpr)
+ case (current, _) => current
+ }
+ if (replacement.isDefined) {
+ replacement.get.toAttribute
} else {
expr match {
case ae: AggregateExpression =>
val cleaned = trimTempResolvedColumn(ae)
- val alias =
- Alias(cleaned, toPrettySQL(e = cleaned, shouldTrimTempResolvedColumn = true))()
- aggExprList += alias
- alias.toAttribute
+ val resultAlias = aggExprMap.computeIfAbsent(
+ cleaned.canonicalized,
+ _ => Alias(cleaned, toPrettySQL(e = cleaned, shouldTrimTempResolvedColumn = true))()
+ )
+ resultAlias.toAttribute
case grouping: Expression if agg.groupingExpressions.exists(grouping.semanticEquals) =>
trimTempResolvedColumn(grouping) match {
case ne: NamedExpression =>
- aggExprList += ne
- ne.toAttribute
+ val resultAttribute = aggExprMap.computeIfAbsent(ne.canonicalized, _ => ne)
+ resultAttribute.toAttribute
case other =>
- val alias =
- Alias(other, toPrettySQL(e = other, shouldTrimTempResolvedColumn = true))()
- aggExprList += alias
- alias.toAttribute
+ val resultAlias = aggExprMap.computeIfAbsent(
+ other.canonicalized,
+ _ => Alias(other, toPrettySQL(e = other, shouldTrimTempResolvedColumn = true))()
+ )
+ resultAlias.toAttribute
}
case t: TempResolvedColumn =>
if (t.child.isInstanceOf[Attribute]) {
@@ -2990,7 +3016,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
val childWithTempCol = t.child.transformUp {
case a: Attribute => TempResolvedColumn(a, Seq(a.name))
}
- val newChild = buildAggExprList(childWithTempCol, agg, aggExprList)
+ val newChild = buildAggExprList(childWithTempCol, agg, aggExprMap)
if (newChild.containsPattern(TEMP_RESOLVED_COLUMN)) {
withOrigin(t.origin)(t.copy(hasTried = true))
} else {
@@ -2998,7 +3024,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
}
}
case other =>
- other.withNewChildren(other.children.map(buildAggExprList(_, agg, aggExprList)))
+ other.withNewChildren(other.children.map(buildAggExprList(_, agg, aggExprMap)))
}
}
}
@@ -3643,23 +3669,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
object ResolveWindowFrame extends Rule[LogicalPlan] {
def apply(plan: LogicalPlan): LogicalPlan = plan.resolveExpressionsWithPruning(
_.containsPattern(WINDOW_EXPRESSION), ruleId) {
- case WindowExpression(wf: FrameLessOffsetWindowFunction,
- WindowSpecDefinition(_, _, f: SpecifiedWindowFrame)) if wf.frame != f =>
- throw QueryCompilationErrors.cannotSpecifyWindowFrameError(wf.prettyName)
- case WindowExpression(wf: WindowFunction, WindowSpecDefinition(_, _, f: SpecifiedWindowFrame))
- if wf.frame != UnspecifiedFrame && wf.frame != f =>
- throw QueryCompilationErrors.windowFrameNotMatchRequiredFrameError(f, wf.frame)
- case WindowExpression(wf: WindowFunction, s @ WindowSpecDefinition(_, _, UnspecifiedFrame))
- if wf.frame != UnspecifiedFrame =>
- WindowExpression(wf, s.copy(frameSpecification = wf.frame))
- case we @ WindowExpression(e, s @ WindowSpecDefinition(_, o, UnspecifiedFrame))
- if e.resolved =>
- val frame = if (o.nonEmpty) {
- SpecifiedWindowFrame(RangeFrame, UnboundedPreceding, CurrentRow)
- } else {
- SpecifiedWindowFrame(RowFrame, UnboundedPreceding, UnboundedFollowing)
- }
- we.copy(windowSpec = s.copy(frameSpecification = frame))
+ case we: WindowExpression => WindowResolution.resolveFrame(we)
}
}
@@ -3669,11 +3679,7 @@ class Analyzer(override val catalogManager: CatalogManager) extends RuleExecutor
object ResolveWindowOrder extends Rule[LogicalPlan] {
def apply(plan: LogicalPlan): LogicalPlan = plan.resolveExpressionsWithPruning(
_.containsPattern(WINDOW_EXPRESSION), ruleId) {
- case WindowExpression(wf: WindowFunction, spec) if spec.orderSpec.isEmpty =>
- throw QueryCompilationErrors.windowFunctionWithWindowFrameNotOrderedError(wf)
- case WindowExpression(rank: RankLike, spec) if spec.resolved =>
- val order = spec.orderSpec.map(_.child)
- WindowExpression(rank.withOrder(order), spec)
+ case we: WindowExpression => WindowResolution.resolveOrder(we)
}
}
@@ -4218,13 +4224,14 @@ object UpdateOuterReferences extends Rule[LogicalPlan] {
private def updateOuterReferenceInSubquery(
plan: LogicalPlan,
refExprs: Seq[Expression]): LogicalPlan = {
- plan resolveExpressions { case e =>
- val outerAlias =
- refExprs.find(stripAlias(_).semanticEquals(stripOuterReference(e)))
- outerAlias match {
- case Some(a: Alias) => OuterReference(a.toAttribute)
- case _ => e
- }
+ plan resolveExpressions {
+ case e if e.containsPattern(OUTER_REFERENCE) =>
+ val outerAlias =
+ refExprs.find(stripAlias(_).semanticEquals(stripOuterReference(e)))
+ outerAlias match {
+ case Some(a: Alias) => OuterReference(a.toAttribute)
+ case _ => e
+ }
}
}
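
Restating the ANSI fallback added to `object Analyzer` above as a tiny standalone function (an empty string stands for "Spark version not persisted"; the prefix check mirrors the code in `trySetAnsiValue`):

```scala
object AnsiFallbackSketch {
  // ANSI defaults to true only for views/UDFs created by Spark 4.x when no explicit
  // ANSI value was persisted with the object.
  def fallbackAnsiValue(createSparkVersion: String): Boolean =
    createSparkVersion.startsWith("4.")

  def main(args: Array[String]): Unit = {
    assert(fallbackAnsiValue("4.0.0"))
    assert(!fallbackAnsiValue("3.5.3"))
    assert(!fallbackAnsiValue(""))  // version not stored => assume non-ANSI
  }
}
```
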
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/AnsiStringPromotionTypeCoercion.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/AnsiStringPromotionTypeCoercion.scala
index e7be95bc645ea..f6d7a9605831a 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/AnsiStringPromotionTypeCoercion.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/AnsiStringPromotionTypeCoercion.scala
@@ -27,7 +27,7 @@ import org.apache.spark.sql.catalyst.expressions.{
Literal,
SubtractDates,
SubtractTimestamps,
- TimeAdd,
+ TimestampAddInterval,
UnaryMinus,
UnaryPositive
}
@@ -77,7 +77,7 @@ object AnsiStringPromotionTypeCoercion {
s.copy(left = Cast(s.left, DateType))
case s @ SubtractDates(_, right @ StringTypeExpression(), _) =>
s.copy(right = Cast(s.right, DateType))
- case t @ TimeAdd(left @ StringTypeExpression(), _, _) =>
+ case t @ TimestampAddInterval(left @ StringTypeExpression(), _, _) =>
t.copy(start = Cast(t.start, TimestampType))
case t @ SubtractTimestamps(left @ StringTypeExpression(), _, _, _) =>
t.copy(left = Cast(t.left, t.right.dataType))
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/BinaryArithmeticWithDatetimeResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/BinaryArithmeticWithDatetimeResolver.scala
index 36a059b2b0f3c..08407bbe96cce 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/BinaryArithmeticWithDatetimeResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/BinaryArithmeticWithDatetimeResolver.scala
@@ -38,8 +38,10 @@ import org.apache.spark.sql.catalyst.expressions.{
MultiplyYMInterval,
Subtract,
SubtractDates,
+ SubtractTimes,
SubtractTimestamps,
- TimeAdd,
+ TimeAddInterval,
+ TimestampAddInterval,
TimestampAddYMInterval,
UnaryMinus
}
@@ -47,12 +49,14 @@ import org.apache.spark.sql.types.{
AnsiIntervalType,
AnyTimestampTypeExpression,
CalendarIntervalType,
+ DatetimeType,
DateType,
DayTimeIntervalType,
NullType,
StringType,
TimestampNTZType,
TimestampType,
+ TimeType,
YearMonthIntervalType
}
import org.apache.spark.sql.types.DayTimeIntervalType.DAY
@@ -62,9 +66,9 @@ object BinaryArithmeticWithDatetimeResolver {
case a @ Add(l, r, mode) =>
(l.dataType, r.dataType) match {
case (DateType, DayTimeIntervalType(DAY, DAY)) => DateAdd(l, ExtractANSIIntervalDays(r))
- case (DateType, _: DayTimeIntervalType) => TimeAdd(Cast(l, TimestampType), r)
+ case (DateType, _: DayTimeIntervalType) => TimestampAddInterval(Cast(l, TimestampType), r)
case (DayTimeIntervalType(DAY, DAY), DateType) => DateAdd(r, ExtractANSIIntervalDays(l))
- case (_: DayTimeIntervalType, DateType) => TimeAdd(Cast(r, TimestampType), l)
+ case (_: DayTimeIntervalType, DateType) => TimestampAddInterval(Cast(r, TimestampType), l)
case (DateType, _: YearMonthIntervalType) => DateAddYMInterval(l, r)
case (_: YearMonthIntervalType, DateType) => DateAddYMInterval(r, l)
case (TimestampType | TimestampNTZType, _: YearMonthIntervalType) =>
@@ -80,10 +84,18 @@ object BinaryArithmeticWithDatetimeResolver {
a.copy(right = Cast(a.right, a.left.dataType))
case (DateType, CalendarIntervalType) =>
DateAddInterval(l, r, ansiEnabled = mode == EvalMode.ANSI)
- case (_, CalendarIntervalType | _: DayTimeIntervalType) => Cast(TimeAdd(l, r), l.dataType)
+ case (_: TimeType, _: DayTimeIntervalType) => TimeAddInterval(l, r)
+ case (_: DatetimeType, _: NullType) =>
+ a.copy(right = Cast(a.right, DayTimeIntervalType.DEFAULT))
+ case (_: DayTimeIntervalType, _: TimeType) => TimeAddInterval(r, l)
+ case (_: NullType, _: DatetimeType) =>
+ a.copy(left = Cast(a.left, DayTimeIntervalType.DEFAULT))
+ case (_, CalendarIntervalType | _: DayTimeIntervalType) =>
+ Cast(TimestampAddInterval(l, r), l.dataType)
case (CalendarIntervalType, DateType) =>
DateAddInterval(r, l, ansiEnabled = mode == EvalMode.ANSI)
- case (CalendarIntervalType | _: DayTimeIntervalType, _) => Cast(TimeAdd(r, l), r.dataType)
+ case (CalendarIntervalType | _: DayTimeIntervalType, _) =>
+ Cast(TimestampAddInterval(r, l), r.dataType)
case (DateType, dt) if dt != StringType => DateAdd(l, r)
case (dt, DateType) if dt != StringType => DateAdd(r, l)
case _ => a
@@ -93,7 +105,8 @@ object BinaryArithmeticWithDatetimeResolver {
case (DateType, DayTimeIntervalType(DAY, DAY)) =>
DateAdd(l, UnaryMinus(ExtractANSIIntervalDays(r), mode == EvalMode.ANSI))
case (DateType, _: DayTimeIntervalType) =>
- DatetimeSub(l, r, TimeAdd(Cast(l, TimestampType), UnaryMinus(r, mode == EvalMode.ANSI)))
+ DatetimeSub(l, r,
+ TimestampAddInterval(Cast(l, TimestampType), UnaryMinus(r, mode == EvalMode.ANSI)))
case (DateType, _: YearMonthIntervalType) =>
DatetimeSub(l, r, DateAddYMInterval(l, UnaryMinus(r, mode == EvalMode.ANSI)))
case (TimestampType | TimestampNTZType, _: YearMonthIntervalType) =>
@@ -101,9 +114,9 @@ object BinaryArithmeticWithDatetimeResolver {
case (CalendarIntervalType, CalendarIntervalType) |
(_: DayTimeIntervalType, _: DayTimeIntervalType) =>
s
- case (_: NullType, _: AnsiIntervalType) =>
+ case (_: NullType, _: AnsiIntervalType | _: DatetimeType) =>
s.copy(left = Cast(s.left, s.right.dataType))
- case (_: AnsiIntervalType, _: NullType) =>
+ case (_: AnsiIntervalType | _: DatetimeType, _: NullType) =>
s.copy(right = Cast(s.right, s.left.dataType))
case (DateType, CalendarIntervalType) =>
DatetimeSub(
@@ -115,14 +128,18 @@ object BinaryArithmeticWithDatetimeResolver {
ansiEnabled = mode == EvalMode.ANSI
)
)
+ case (_: TimeType, _: DayTimeIntervalType) =>
+ DatetimeSub(l, r, TimeAddInterval(l, UnaryMinus(r, mode == EvalMode.ANSI)))
case (_, CalendarIntervalType | _: DayTimeIntervalType) =>
- Cast(DatetimeSub(l, r, TimeAdd(l, UnaryMinus(r, mode == EvalMode.ANSI))), l.dataType)
+ Cast(DatetimeSub(l, r,
+ TimestampAddInterval(l, UnaryMinus(r, mode == EvalMode.ANSI))), l.dataType)
case _
if AnyTimestampTypeExpression.unapply(l) ||
AnyTimestampTypeExpression.unapply(r) =>
SubtractTimestamps(l, r)
case (_, DateType) => SubtractDates(l, r)
case (DateType, dt) if dt != StringType => DateSub(l, r)
+ case (_: TimeType, _: TimeType) => SubtractTimes(l, r)
case _ => s
}
case m @ Multiply(l, r, mode) =>
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/CheckAnalysis.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/CheckAnalysis.scala
index f34cf8ce53498..2ff842553bee6 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/CheckAnalysis.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/CheckAnalysis.scala
@@ -19,11 +19,12 @@ package org.apache.spark.sql.catalyst.analysis
import scala.collection.mutable
import org.apache.spark.{SparkException, SparkThrowable}
+import org.apache.spark.api.python.PythonEvalType
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.ExtendedAnalysisException
import org.apache.spark.sql.catalyst.analysis.ResolveWithCTE.checkIfSelfReferenceIsPlacedCorrectly
import org.apache.spark.sql.catalyst.expressions._
-import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, AggregateFunction, ListAgg, Median, PercentileCont, PercentileDisc}
+import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, AggregateFunction, ListAgg}
import org.apache.spark.sql.catalyst.optimizer.InlineCTE
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.trees.TreePattern.{LATERAL_COLUMN_ALIAS_REFERENCE, PLAN_EXPRESSION, UNRESOLVED_WINDOW_EXPRESSION}
@@ -437,51 +438,13 @@ trait CheckAnalysis extends LookupCatalog with QueryErrorsBase with PlanToString
errorClass = "WINDOW_FUNCTION_WITHOUT_OVER_CLAUSE",
messageParameters = Map("funcName" -> toSQLExpr(w)))
- case w @ WindowExpression(AggregateExpression(_, _, true, _, _), _) =>
- w.failAnalysis(
- errorClass = "DISTINCT_WINDOW_FUNCTION_UNSUPPORTED",
- messageParameters = Map("windowExpr" -> toSQLExpr(w)))
-
- case w @ WindowExpression(wf: FrameLessOffsetWindowFunction,
- WindowSpecDefinition(_, order, frame: SpecifiedWindowFrame))
- if order.isEmpty || !frame.isOffset =>
- w.failAnalysis(
- errorClass = "WINDOW_FUNCTION_AND_FRAME_MISMATCH",
- messageParameters = Map(
- "funcName" -> toSQLExpr(wf),
- "windowExpr" -> toSQLExpr(w)))
-
case agg @ AggregateExpression(listAgg: ListAgg, _, _, _, _)
if agg.isDistinct && listAgg.needSaveOrderValue =>
throw QueryCompilationErrors.functionAndOrderExpressionMismatchError(
listAgg.prettyName, listAgg.child, listAgg.orderExpressions)
case w: WindowExpression =>
- // Only allow window functions with an aggregate expression or an offset window
- // function or a Pandas window UDF.
- w.windowFunction match {
- case agg @ AggregateExpression(fun: ListAgg, _, _, _, _)
- // listagg(...) WITHIN GROUP (ORDER BY ...) OVER (ORDER BY ...) is unsupported
- if fun.orderingFilled && (w.windowSpec.orderSpec.nonEmpty ||
- w.windowSpec.frameSpecification !=
- SpecifiedWindowFrame(RowFrame, UnboundedPreceding, UnboundedFollowing)) =>
- agg.failAnalysis(
- errorClass = "INVALID_WINDOW_SPEC_FOR_AGGREGATION_FUNC",
- messageParameters = Map("aggFunc" -> toSQLExpr(agg.aggregateFunction)))
- case agg @ AggregateExpression(
- _: PercentileCont | _: PercentileDisc | _: Median, _, _, _, _)
- if w.windowSpec.orderSpec.nonEmpty || w.windowSpec.frameSpecification !=
- SpecifiedWindowFrame(RowFrame, UnboundedPreceding, UnboundedFollowing) =>
- agg.failAnalysis(
- errorClass = "INVALID_WINDOW_SPEC_FOR_AGGREGATION_FUNC",
- messageParameters = Map("aggFunc" -> toSQLExpr(agg.aggregateFunction)))
- case _: AggregateExpression | _: FrameLessOffsetWindowFunction |
- _: AggregateWindowFunction => // OK
- case other =>
- other.failAnalysis(
- errorClass = "UNSUPPORTED_EXPR_FOR_WINDOW",
- messageParameters = Map("sqlExpr" -> toSQLExpr(other)))
- }
+ WindowResolution.validateResolvedWindowExpression(w)
case s: SubqueryExpression =>
checkSubqueryExpression(operator, s)
@@ -569,7 +532,19 @@ trait CheckAnalysis extends LookupCatalog with QueryErrorsBase with PlanToString
messageParameters = Map.empty)
}
- case a: Aggregate => ExprUtils.assertValidAggregation(a)
+ case a: Aggregate =>
+ a.groupingExpressions.foreach(
+ expression =>
+ if (!expression.deterministic) {
+ throw SparkException.internalError(
+ msg = s"Non-deterministic expression '${toSQLExpr(expression)}' should not " +
+ "appear in grouping expression.",
+ context = expression.origin.getQueryContext,
+ summary = expression.origin.context.summary
+ )
+ }
+ )
+ ExprUtils.assertValidAggregation(a)
case CollectMetrics(name, metrics, _, _) =>
if (name == null || name.isEmpty) {
@@ -747,7 +722,7 @@ trait CheckAnalysis extends LookupCatalog with QueryErrorsBase with PlanToString
case c: CreateVariable
if c.resolved && c.defaultExpr.child.containsPattern(PLAN_EXPRESSION) =>
- val ident = c.name.asInstanceOf[ResolvedIdentifier]
+ val ident = c.names(0).asInstanceOf[ResolvedIdentifier]
val varName = toSQLId(
(ident.catalog.name +: ident.identifier.namespace :+ ident.identifier.name)
.toImmutableArraySeq)
@@ -915,6 +890,17 @@ trait CheckAnalysis extends LookupCatalog with QueryErrorsBase with PlanToString
messageParameters = Map(
"invalidExprSqls" -> invalidExprSqls.mkString(", ")))
+ case j @ LateralJoin(_, right, _, _)
+ if j.getTagValue(LateralJoin.BY_TABLE_ARGUMENT).isEmpty =>
+ right.plan.foreach {
+ case Generate(pyudtf: PythonUDTF, _, _, _, _, _)
+ if pyudtf.evalType == PythonEvalType.SQL_ARROW_UDTF =>
+ j.failAnalysis(
+ errorClass = "LATERAL_JOIN_WITH_ARROW_UDTF_UNSUPPORTED",
+ messageParameters = Map.empty)
+ case _ =>
+ }
+
case _ => // Analysis successful!
}
}
@@ -947,30 +933,14 @@ trait CheckAnalysis extends LookupCatalog with QueryErrorsBase with PlanToString
if (expr.plan.isStreaming) {
plan.failAnalysis("INVALID_SUBQUERY_EXPRESSION.STREAMING_QUERY", Map.empty)
}
- assertNoRecursiveCTE(expr.plan)
checkAnalysis0(expr.plan)
ValidateSubqueryExpression(plan, expr)
}
- private def assertNoRecursiveCTE(plan: LogicalPlan): Unit = {
- plan.foreach {
- case r: CTERelationRef if r.recursive =>
- throw new AnalysisException(
- errorClass = "INVALID_RECURSIVE_REFERENCE.PLACE",
- messageParameters = Map.empty)
- case p => p.expressions.filter(_.containsPattern(PLAN_EXPRESSION)).foreach {
- expr => expr.foreach {
- case s: SubqueryExpression => assertNoRecursiveCTE(s.plan)
- case _ =>
- }
- }
- }
- }
-
/**
* Validate that collected metrics names are unique. The same name cannot be used for metrics
- * with different results. However multiple instances of metrics with with same result and name
- * are allowed (e.g. self-joins).
+   * with different results. However, multiple instances of metrics with the same result and name
+   * are allowed (e.g. self-joins).
*/
private def checkCollectedMetrics(plan: LogicalPlan): Unit = {
val metricsMap = mutable.Map.empty[String, CollectMetrics]
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ColumnResolutionHelper.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ColumnResolutionHelper.scala
index 6823cdbf36ba2..bade5f0bee9d6 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ColumnResolutionHelper.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ColumnResolutionHelper.scala
@@ -23,14 +23,12 @@ import scala.collection.mutable
import org.apache.spark.internal.Logging
import org.apache.spark.sql.AnalysisException
-import org.apache.spark.sql.catalyst.SqlScriptingContextManager
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.SubExprUtils.wrapOuterReference
-import org.apache.spark.sql.catalyst.parser.SqlScriptingLabelContext.isForbiddenLabelName
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.trees.CurrentOrigin.withOrigin
import org.apache.spark.sql.catalyst.trees.TreePattern._
-import org.apache.spark.sql.connector.catalog.{CatalogManager, Identifier}
+import org.apache.spark.sql.connector.catalog.CatalogManager
import org.apache.spark.sql.errors.{DataTypeErrorsBase, QueryCompilationErrors}
import org.apache.spark.sql.internal.SQLConf
@@ -210,7 +208,11 @@ trait ColumnResolutionHelper extends Logging with DataTypeErrorsBase {
case u @ UnresolvedHaving(_, agg: Aggregate) =>
agg.resolveChildren(nameParts, conf.resolver)
.orElse(u.resolveChildren(nameParts, conf.resolver))
- .map(wrapOuterReference)
+ .map {
+ case alias: Alias =>
+ wrapOuterReference(alias.child)
+ case other => wrapOuterReference(other)
+ }
case other =>
other.resolveChildren(nameParts, conf.resolver).map(wrapOuterReference)
}
@@ -231,102 +233,17 @@ trait ColumnResolutionHelper extends Logging with DataTypeErrorsBase {
}
}
- /**
- * Look up variable by nameParts.
- * If in SQL Script, first check local variables, unless in EXECUTE IMMEDIATE
- * (EXECUTE IMMEDIATE generated query cannot access local variables).
- * if not found fall back to session variables.
- * @param nameParts NameParts of the variable.
- * @return Reference to the variable.
- */
- def lookupVariable(nameParts: Seq[String]): Option[VariableReference] = {
- // The temp variables live in `SYSTEM.SESSION`, and the name can be qualified or not.
- def maybeTempVariableName(nameParts: Seq[String]): Boolean = {
- nameParts.length == 1 || {
- if (nameParts.length == 2) {
- nameParts.head.equalsIgnoreCase(CatalogManager.SESSION_NAMESPACE)
- } else if (nameParts.length == 3) {
- nameParts(0).equalsIgnoreCase(CatalogManager.SYSTEM_CATALOG_NAME) &&
- nameParts(1).equalsIgnoreCase(CatalogManager.SESSION_NAMESPACE)
- } else {
- false
- }
- }
- }
-
- val namePartsCaseAdjusted = if (conf.caseSensitiveAnalysis) {
- nameParts
- } else {
- nameParts.map(_.toLowerCase(Locale.ROOT))
- }
-
- SqlScriptingContextManager.get().map(_.getVariableManager)
- // If we are in EXECUTE IMMEDIATE lookup only session variables.
- .filterNot(_ => AnalysisContext.get.isExecuteImmediate)
- // If variable name is qualified with session. treat it as a session variable.
- .filterNot(_ =>
- nameParts.length > 2 || (nameParts.length == 2 && isForbiddenLabelName(nameParts.head)))
- .flatMap(_.get(namePartsCaseAdjusted))
- .map { varDef =>
- VariableReference(
- nameParts,
- FakeLocalCatalog,
- Identifier.of(Array(varDef.identifier.namespace().last), namePartsCaseAdjusted.last),
- varDef)
- }
- .orElse(
- if (maybeTempVariableName(nameParts)) {
- catalogManager.tempVariableManager
- .get(namePartsCaseAdjusted)
- .map { varDef =>
- VariableReference(
- nameParts,
- FakeSystemCatalog,
- Identifier.of(Array(CatalogManager.SESSION_NAMESPACE), namePartsCaseAdjusted.last),
- varDef
- )}
- } else {
- None
- }
- )
- }
-
// Resolves `UnresolvedAttribute` to its value.
protected def resolveVariables(e: Expression): Expression = {
- def resolveVariable(nameParts: Seq[String]): Option[Expression] = {
- val isResolvingView = AnalysisContext.get.catalogAndNamespace.nonEmpty
- if (isResolvingView) {
- if (AnalysisContext.get.referredTempVariableNames.contains(nameParts)) {
- lookupVariable(nameParts)
- } else {
- None
- }
- } else {
- lookupVariable(nameParts)
- }
- }
+ val variableResolution = new VariableResolution(catalogManager.tempVariableManager)
def resolve(nameParts: Seq[String]): Option[Expression] = {
- var resolvedVariable: Option[Expression] = None
- // We only support temp variables for now, so the variable name can at most have 3 parts.
- var numInnerFields: Int = math.max(0, nameParts.length - 3)
- // Follow the column resolution and prefer the longest match. This makes sure that users
- // can always use fully qualified variable name to avoid name conflicts.
- while (resolvedVariable.isEmpty && numInnerFields < nameParts.length) {
- resolvedVariable = resolveVariable(nameParts.dropRight(numInnerFields))
- if (resolvedVariable.isEmpty) numInnerFields += 1
- }
-
- resolvedVariable.map { variable =>
- if (numInnerFields != 0) {
- val nestedFields = nameParts.takeRight(numInnerFields)
- nestedFields.foldLeft(variable: Expression) { (e, name) =>
- ExtractValue(e, Literal(name), conf.resolver)
- }
- } else {
- variable
- }
- }.map(e => Alias(e, nameParts.last)())
+ variableResolution.resolveMultipartName(
+ nameParts = nameParts,
+ resolvingView = AnalysisContext.get.catalogAndNamespace.nonEmpty,
+ resolvingExecuteImmediate = AnalysisContext.get.isExecuteImmediate,
+ referredTempVariableNames = AnalysisContext.get.referredTempVariableNames
+ ).map(e => Alias(e, nameParts.last)())
}
def innerResolve(e: Expression, isTopLevel: Boolean): Expression = withOrigin(e.origin) {
@@ -505,6 +422,33 @@ trait ColumnResolutionHelper extends Logging with DataTypeErrorsBase {
includeLastResort = includeLastResort)
}
+ // Try to resolve `UnresolvedAttribute` by the children with Plan Ids.
+ // The `UnresolvedAttribute` must have a Plan Id:
+  // - If the Plan Id is not found in the plan, raise CANNOT_RESOLVE_DATAFRAME_COLUMN.
+  // - If the Plan Id is found in the plan but the column is not found, return None.
+ // - Otherwise, return the resolved expression.
+ private[sql] def tryResolveColumnByPlanChildren(
+ u: UnresolvedAttribute,
+ q: LogicalPlan,
+ includeLastResort: Boolean = false): Option[Expression] = {
+ assert(u.getTagValue(LogicalPlan.PLAN_ID_TAG).nonEmpty,
+ s"UnresolvedAttribute $u should have a Plan Id tag")
+
+ resolveDataFrameColumn(u, q.children).map { r =>
+ resolveExpression(
+ r,
+ resolveColumnByName = nameParts => {
+ q.resolveChildren(nameParts, conf.resolver)
+ },
+ getAttrCandidates = () => {
+ assert(q.children.length == 1)
+ q.children.head.output
+ },
+ throws = true,
+ includeLastResort = includeLastResort)
+ }
+ }
+
/**
* The last resort to resolve columns. Currently it does two things:
* - Try to resolve column names as outer references
@@ -526,10 +470,15 @@ trait ColumnResolutionHelper extends Logging with DataTypeErrorsBase {
// expression are from Spark Connect, and need to be resolved in this way:
// 1. extract the attached plan id from UnresolvedAttribute;
// 2. top-down traverse the query plan to find the plan node that matches the plan id;
- // 3. if can not find the matching node, fail the analysis due to illegal references;
- // 4. if more than one matching nodes are found, fail due to ambiguous column reference;
- // 5. resolve the expression with the matching node, if any error occurs here, return the
- // original expression as it is.
+    // 3. if the matching node cannot be found, fail with 'CANNOT_RESOLVE_DATAFRAME_COLUMN';
+    // 4. if the matching node is found but the column cannot be resolved there, also fail with
+    //    'CANNOT_RESOLVE_DATAFRAME_COLUMN';
+    // 5. resolve the expression against the target node; the resolved attribute will be
+    //    filtered by the output attributes of the nodes on the path from the matching node
+    //    to the root node;
+    // 6. if more than one resolved attribute is found in the above recursive process,
+    //    fail with 'AMBIGUOUS_COLUMN_REFERENCE';
+    // 7. if all the resolved attributes are filtered out, return the original expression
+    //    as it is.
private def tryResolveDataFrameColumns(
e: Expression,
q: Seq[LogicalPlan]): Expression = e match {
@@ -591,18 +540,16 @@ trait ColumnResolutionHelper extends Logging with DataTypeErrorsBase {
p: LogicalPlan,
currentDepth: Int): (Option[(NamedExpression, Int)], Boolean) = {
val (resolved, matched) = if (p.getTagValue(LogicalPlan.PLAN_ID_TAG).contains(id)) {
- val resolved = try {
- if (!isMetadataAccess) {
- p.resolve(u.nameParts, conf.resolver)
- } else if (u.nameParts.size == 1) {
- p.getMetadataAttributeByNameOpt(u.nameParts.head)
- } else {
- None
- }
- } catch {
- case e: AnalysisException =>
- logDebug(s"Fail to resolve $u with $p due to $e")
- None
+ val resolved = if (!isMetadataAccess) {
+ p.resolve(u.nameParts, conf.resolver)
+ } else if (u.nameParts.size == 1) {
+ p.getMetadataAttributeByNameOpt(u.nameParts.head)
+ } else {
+ None
+ }
+ if (resolved.isEmpty) {
+          // The target plan node is found, but the column cannot be resolved.
+ throw QueryCompilationErrors.cannotResolveDataFrameColumn(u)
}
(resolved.map(r => (r, currentDepth)), true)
} else {
@@ -631,14 +578,20 @@ trait ColumnResolutionHelper extends Logging with DataTypeErrorsBase {
// When resolving the column reference df1.a, the target node with plan_id=1
// can be found in both sides of the Join node.
// To correctly resolve df1.a, the analyzer discards the resolved attribute
- // in the right side, by filtering out the result by the output attributes of
+ // on the right side, by filtering out the result by the output attributes of
// Project plan_id=2.
//
// However, there are analyzer rules (e.g. ResolveReferencesInSort)
// supporting missing column resolution. Then a valid resolved attribute
- // maybe filtered out here. In this case, resolveDataFrameColumnByPlanId
- // returns None, the dataframe column will remain unresolved, and the analyzer
- // will try to resolve it without plan id later.
+    // may be filtered out here. For example:
+ //
+ // from pyspark.sql import functions as sf
+ // df = spark.range(10).withColumn("v", sf.col("id") + 1)
+ // df.select(df.v).sort(df.id)
+ //
+ // In this case, resolveDataFrameColumnByPlanId returns None,
+ // the dataframe column 'df.id' will remain unresolved, and the analyzer
+ // will try to resolve 'id' without plan id later.
val filtered = resolved.filter { r =>
if (isMetadataAccess) {
r._1.references.subsetOf(AttributeSet(p.output ++ p.metadataOutput))
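
A minimal Scala sketch of the missing-column scenario described in the comment above, assuming a SparkSession named `spark`; it mirrors the PySpark example and is illustrative only, not part of the patch:

    import org.apache.spark.sql.functions.col

    // 'v' resolves through the plan id, but 'id' is projected away by the select(), so the
    // plan-id lookup filters it out and the analyzer later falls back to resolving the plain
    // name 'id' through the regular missing-column path.
    val df = spark.range(10).withColumn("v", col("id") + 1)
    df.select(df("v")).sort(df("id"))
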
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateRelations.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateRelations.scala
index 752a2a648ce99..b8da376bead6f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateRelations.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateRelations.scala
@@ -19,16 +19,14 @@ package org.apache.spark.sql.catalyst.analysis
import scala.collection.mutable
+import org.apache.spark.sql.catalyst.analysis.resolver.ResolverTag
import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute, AttributeMap, AttributeReference, AttributeSet, Expression, NamedExpression, OuterReference, SubqueryExpression}
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.rules.Rule
-import org.apache.spark.sql.catalyst.trees.TreeNodeTag
import org.apache.spark.sql.catalyst.trees.TreePattern._
+import org.apache.spark.sql.internal.SQLConf
object DeduplicateRelations extends Rule[LogicalPlan] {
- val PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION =
- TreeNodeTag[Unit]("project_for_expression_id_deduplication")
-
type ExprIdMap = mutable.HashMap[Class[_], mutable.HashSet[Long]]
override def apply(plan: LogicalPlan): LogicalPlan = {
@@ -59,23 +57,30 @@ object DeduplicateRelations extends Rule[LogicalPlan] {
case e @ Except(left, right, _) if !e.duplicateResolved && noMissingInput(right) =>
e.copy(right = dedupRight(left, right))
// Only after we finish by-name resolution for Union
- case u: Union if !u.byName && !u.duplicateResolved =>
+ case u: Union if !u.byName && !u.duplicatesResolvedBetweenBranches =>
+ val unionWithChildOutputsDeduplicated =
+ DeduplicateUnionChildOutput.deduplicateOutputPerChild(u)
// Use projection-based de-duplication for Union to avoid breaking the checkpoint sharing
// feature in streaming.
- val newChildren = u.children.foldRight(Seq.empty[LogicalPlan]) { (head, tail) =>
- head +: tail.map {
- case child if head.outputSet.intersect(child.outputSet).isEmpty =>
- child
- case child =>
- val projectList = child.output.map { attr =>
- Alias(attr, attr.name)()
+ val newChildren =
+ unionWithChildOutputsDeduplicated.children.foldRight(Seq.empty[LogicalPlan]) {
+ (head, tail) =>
+ head +: tail.map {
+ case child if head.outputSet.intersect(child.outputSet).isEmpty =>
+ child
+ case child =>
+ val projectList = child.output.map { attr =>
+ Alias(attr, attr.name)()
+ }
+ val project = Project(projectList, child)
+ project.setTagValue(
+ ResolverTag.PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION,
+ ()
+ )
+ project
}
- val project = Project(projectList, child)
- project.setTagValue(DeduplicateRelations.PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION, ())
- project
}
- }
- u.copy(children = newChildren)
+ unionWithChildOutputsDeduplicated.copy(children = newChildren)
case merge: MergeIntoTable
if !merge.duplicateResolved && noMissingInput(merge.sourceTable) =>
merge.copy(sourceTable = dedupRight(merge.targetTable, merge.sourceTable))
@@ -237,8 +242,17 @@ object DeduplicateRelations extends Rule[LogicalPlan] {
if (planChanged) {
if (planWithNewSubquery.childrenResolved) {
val planWithNewChildren = planWithNewSubquery.withNewChildren(newChildren.toSeq)
+ val childrenOutputLookup = AttributeSet.fromAttributeSets(newChildren.map(_.outputSet))
+ val childrenOutput = newChildren.flatMap(_.output)
val attrMap = AttributeMap(plan.children.flatMap(_.output)
- .zip(newChildren.flatMap(_.output)).filter { case (a1, a2) => a1.exprId != a2.exprId })
+ .zip(childrenOutput).filter { case (a1, a2) => a1.exprId != a2.exprId })
+ val preventDeduplicationIfOldExprIdStillExists =
+ conf.getConf(SQLConf.DONT_DEDUPLICATE_EXPRESSION_IF_EXPR_ID_IN_OUTPUT)
+ val missingAttributeMap = AttributeMap(attrMap.filter {
+ case (oldAttribute, _) =>
+ !preventDeduplicationIfOldExprIdStillExists ||
+ !childrenOutputLookup.contains(oldAttribute)
+ })
if (attrMap.isEmpty) {
planWithNewChildren
} else {
@@ -282,7 +296,7 @@ object DeduplicateRelations extends Rule[LogicalPlan] {
rightDeserializer = newRightDes, leftGroup = newLeftGroup,
rightGroup = newRightGroup, leftAttr = newLeftAttr, rightAttr = newRightAttr,
leftOrder = newLeftOrder, rightOrder = newRightOrder)
- case _ => planWithNewChildren.rewriteAttrs(attrMap)
+ case _ => planWithNewChildren.rewriteAttrs(missingAttributeMap)
}
}
} else {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateUnionChildOutput.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateUnionChildOutput.scala
new file mode 100644
index 0000000000000..11a10710a6170
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/DeduplicateUnionChildOutput.scala
@@ -0,0 +1,82 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis
+
+import scala.collection.mutable
+
+import org.apache.spark.sql.catalyst.expressions.{Alias, ExprId}
+import org.apache.spark.sql.catalyst.plans.logical.{Project, Union}
+import org.apache.spark.sql.types.MetadataBuilder
+
+/**
+ * Deduplicates columns with the same [[ExprId]] within a single [[Union]] child's output, by
+ * placing aliases on the non-first duplicates.
+ */
+object DeduplicateUnionChildOutput {
+
+ /**
+ * Deduplicate expression IDs at the scope of each individual child output. This is necessary to
+ * handle the following case:
+ *
+ * {{{
+ * -- The correct answer is (1, 1), (1, 2). Without deduplication it would be (1, 1), because
+ * -- aggregation would be done only based on the first column.
+ * SELECT
+ * a, a
+ * FROM
+ * VALUES (1, 1), (1, 2) AS t1 (a, b)
+ * UNION
+ * SELECT
+ * a, b
+ * FROM
+ * VALUES (1, 1), (1, 2) AS t2 (a, b)
+ * }}}
+ *
+ * Putting an [[Alias]] on a duplicate introduces a new expression ID for it in the output. We
+ * also add `__is_duplicate` metadata so that [[AttributeSeq.getCandidatesForResolution]] doesn't
+ * produce conflicting candidates when resolving names in the upper [[Project]] - this is
+ * technically still the same attribute.
+ *
+ * See SPARK-37865 for more details.
+ */
+ def deduplicateOutputPerChild(union: Union): Union = {
+ val newChildren = union.children.map { c =>
+ if (c.output.map(_.exprId).distinct.length < c.output.length) {
+ val existingExprIds = mutable.HashSet[ExprId]()
+ val projectList = c.output.map { attr =>
+ if (existingExprIds.contains(attr.exprId)) {
+ // replace non-first duplicates with aliases and tag them
+ val newMetadata = new MetadataBuilder()
+ .withMetadata(attr.metadata)
+ .putNull("__is_duplicate")
+ .build()
+ Alias(attr, attr.name)(explicitMetadata = Some(newMetadata))
+ } else {
+ // leave first duplicate alone
+ existingExprIds.add(attr.exprId)
+ attr
+ }
+ }
+ Project(projectList, c)
+ } else {
+ c
+ }
+ }
+ union.withNewChildren(newChildren).asInstanceOf[Union]
+ }
+}
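
A hedged, test-style sketch of how the helper above behaves on a hand-built plan; the attributes and relation below are made up for illustration and are not part of the patch:

    import org.apache.spark.sql.catalyst.analysis.DeduplicateUnionChildOutput
    import org.apache.spark.sql.catalyst.expressions.AttributeReference
    import org.apache.spark.sql.catalyst.plans.logical.{LocalRelation, Project, Union}
    import org.apache.spark.sql.types.IntegerType

    val a = AttributeReference("a", IntegerType)()
    val b = AttributeReference("b", IntegerType)()
    // The first child exposes the same ExprId twice; the second child is already unique.
    val left  = Project(Seq(a, a), LocalRelation(a, b))
    val right = Project(Seq(a, b), LocalRelation(a, b))
    // The second `a` in `left` gets wrapped in an Alias carrying `__is_duplicate` metadata,
    // which gives it a fresh ExprId while still evaluating to the same value.
    val deduped = DeduplicateUnionChildOutput.deduplicateOutputPerChild(Union(Seq(left, right)))
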
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/FunctionRegistry.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/FunctionRegistry.scala
index 66db1fe8b5965..99e0c707d8871 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/FunctionRegistry.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/FunctionRegistry.scala
@@ -24,7 +24,7 @@ import scala.collection.mutable
import scala.reflect.ClassTag
import org.apache.spark.SparkUnsupportedOperationException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.FUNCTION_NAME
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.FunctionIdentifier
@@ -463,6 +463,7 @@ object FunctionRegistry {
expressionBuilder("try_sum", TrySumExpressionBuilder, setAlias = true),
expression[TryToBinary]("try_to_binary"),
expressionBuilder("try_to_timestamp", TryToTimestampExpressionBuilder, setAlias = true),
+ expressionBuilder("try_to_date", TryToDateExpressionBuilder, setAlias = true),
expressionBuilder("try_to_time", TryToTimeExpressionBuilder, setAlias = true),
expression[TryAesDecrypt]("try_aes_decrypt"),
expression[TryReflect]("try_reflect"),
@@ -527,6 +528,8 @@ object FunctionRegistry {
expressionBuilder("mode", ModeBuilder),
expression[HllSketchAgg]("hll_sketch_agg"),
expression[HllUnionAgg]("hll_union_agg"),
+ expression[ApproxTopK]("approx_top_k"),
+ expression[ApproxTopKAccumulate]("approx_top_k_accumulate"),
// string functions
expression[Ascii]("ascii"),
@@ -652,6 +655,7 @@ object FunctionRegistry {
expressionBuilder("second", SecondExpressionBuilder),
expression[ParseToTimestamp]("to_timestamp"),
expression[ParseToDate]("to_date"),
+ expression[TimeDiff]("time_diff"),
expression[ToTime]("to_time"),
expression[ToBinary]("to_binary"),
expression[ToUnixTimestamp]("to_unix_timestamp"),
@@ -672,7 +676,8 @@ object FunctionRegistry {
expression[WindowTime]("window_time"),
expression[MakeDate]("make_date"),
expression[MakeTime]("make_time"),
- expression[MakeTimestamp]("make_timestamp"),
+ expression[TimeTrunc]("time_trunc"),
+ expressionBuilder("make_timestamp", MakeTimestampExpressionBuilder),
expression[TryMakeTimestamp]("try_make_timestamp"),
expression[MonthName]("monthname"),
// We keep the 2 expression builders below to have different function docs.
@@ -785,6 +790,7 @@ object FunctionRegistry {
expression[EqualNull]("equal_null"),
expression[HllSketchEstimate]("hll_sketch_estimate"),
expression[HllUnion]("hll_union"),
+ expression[ApproxTopKEstimate]("approx_top_k_estimate"),
// grouping sets
expression[Grouping]("grouping"),
@@ -870,6 +876,7 @@ object FunctionRegistry {
castAlias("decimal", DecimalType.USER_DEFAULT),
castAlias("date", DateType),
castAlias("timestamp", TimestampType),
+ castAlias("time", TimeType()),
castAlias("binary", BinaryType),
castAlias("string", StringType),
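
Hedged usage examples for two of the newly registered functions, assuming a SparkSession named `spark`; the argument shapes are assumed to mirror the existing to_date and cast-alias builders rather than being spelled out in this hunk:

    // try_to_date follows the try_* convention: NULL instead of an error on malformed input.
    spark.sql("SELECT try_to_date('2024-13-40')").show()
    // The new `time` alias casts its argument, like the existing `date`/`timestamp` aliases.
    spark.sql("SELECT time('12:30:00')").show()
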
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/HintErrorLogger.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/HintErrorLogger.scala
index 5301a3683c7da..8edc5278b5319 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/HintErrorLogger.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/HintErrorLogger.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.catalyst.analysis
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{QUERY_HINT, RELATION_NAME, UNSUPPORTED_HINT_REASON}
import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.plans.logical.{HintErrorHandler, HintInfo}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/IdentifierResolution.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/IdentifierResolution.scala
new file mode 100644
index 0000000000000..e274c1e2162a5
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/IdentifierResolution.scala
@@ -0,0 +1,51 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis
+
+import org.apache.spark.sql.catalyst.expressions.{AliasHelper, EvalHelper, Expression}
+import org.apache.spark.sql.catalyst.parser.CatalystSqlParser
+import org.apache.spark.sql.types.StringType
+
+object IdentifierResolution extends AliasHelper with EvalHelper {
+ def evalIdentifierExpr(expr: Expression): Seq[String] = {
+ trimAliases(prepareForEval(expr)) match {
+ case e if !e.foldable =>
+ expr.failAnalysis(
+ errorClass = "NOT_A_CONSTANT_STRING.NOT_CONSTANT",
+ messageParameters = Map("name" -> "IDENTIFIER", "expr" -> expr.sql)
+ )
+ case e if e.dataType != StringType =>
+ expr.failAnalysis(
+ errorClass = "NOT_A_CONSTANT_STRING.WRONG_TYPE",
+ messageParameters =
+ Map("name" -> "IDENTIFIER", "expr" -> expr.sql, "dataType" -> e.dataType.catalogString)
+ )
+ case e =>
+ e.eval() match {
+ case null =>
+ expr.failAnalysis(
+ errorClass = "NOT_A_CONSTANT_STRING.NULL",
+ messageParameters = Map("name" -> "IDENTIFIER", "expr" -> expr.sql)
+ )
+ case other =>
+ // Parse the identifier string to name parts.
+ CatalystSqlParser.parseMultipartIdentifier(other.toString)
+ }
+ }
+ }
+}
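
A hedged sketch of the extracted helper's contract; the literal below is only an illustration:

    import org.apache.spark.sql.catalyst.analysis.IdentifierResolution
    import org.apache.spark.sql.catalyst.expressions.Literal

    // A constant, non-null string expression is parsed into its name parts:
    IdentifierResolution.evalIdentifierExpr(Literal("cat.db.tbl"))  // Seq("cat", "db", "tbl")
    // A non-foldable, non-string, or NULL expression fails analysis with the
    // corresponding NOT_A_CONSTANT_STRING.* error class, as in the match above.
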
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/NondeterministicExpressionCollection.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/NondeterministicExpressionCollection.scala
index d530cfe5175ba..1dc5d79dc1b59 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/NondeterministicExpressionCollection.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/NondeterministicExpressionCollection.scala
@@ -38,7 +38,7 @@ object NondeterministicExpressionCollection {
case namedExpression: NamedExpression => namedExpression
case _ => Alias(nondeterministicExpr, "_nondeterministic")()
}
- nonDeterministicToAttributes.put(nondeterministicExpr, namedExpression)
+ nonDeterministicToAttributes.put(nondeterministicExpr.canonicalized, namedExpression)
}
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/PullOutNondeterministic.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/PullOutNondeterministic.scala
index e0b984540cac0..09d3a6f93a878 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/PullOutNondeterministic.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/PullOutNondeterministic.scala
@@ -19,7 +19,9 @@ package org.apache.spark.sql.catalyst.analysis
import scala.jdk.CollectionConverters._
+import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.expressions._
+import org.apache.spark.sql.catalyst.expressions.ExprUtils.toSQLExpr
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.rules.Rule
@@ -39,10 +41,20 @@ object PullOutNondeterministic extends Rule[LogicalPlan] {
val nondeterToAttr =
NondeterministicExpressionCollection.getNondeterministicToAttributes(a.groupingExpressions)
val newChild = Project(a.child.output ++ nondeterToAttr.values.asScala.toSeq, a.child)
- a.transformExpressions { case e =>
- Option(nondeterToAttr.get(e)).map(_.toAttribute).getOrElse(e)
+ val deterministicAggregate = a.transformExpressions { case e =>
+ Option(nondeterToAttr.get(e.canonicalized)).map(_.toAttribute).getOrElse(e)
}.copy(child = newChild)
+ deterministicAggregate.groupingExpressions.foreach(expr => if (!expr.deterministic) {
+ throw SparkException.internalError(
+ msg = s"Non-deterministic expression '${toSQLExpr(expr)}' should not appear in " +
+ "grouping expression.",
+ context = expr.origin.getQueryContext,
+ summary = expr.origin.context.summary)
+ })
+
+ deterministicAggregate
+
// Don't touch collect metrics. Top-level metrics are not supported (check analysis will fail)
// and we want to retain them inside the aggregate functions.
case m: CollectMetrics => m
@@ -57,7 +69,7 @@ object PullOutNondeterministic extends Rule[LogicalPlan] {
val nondeterToAttr =
NondeterministicExpressionCollection.getNondeterministicToAttributes(p.expressions)
val newPlan = p.transformExpressions { case e =>
- Option(nondeterToAttr.get(e)).map(_.toAttribute).getOrElse(e)
+ Option(nondeterToAttr.get(e.canonicalized)).map(_.toAttribute).getOrElse(e)
}
val newChild = Project(p.child.output ++ nondeterToAttr.values.asScala.toSeq, p.child)
Project(p.output, newPlan.withNewChildren(newChild :: Nil))
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveCatalogs.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveCatalogs.scala
index 72d92e5a9445e..851db598c4e39 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveCatalogs.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveCatalogs.scala
@@ -40,35 +40,40 @@ class ResolveCatalogs(val catalogManager: CatalogManager)
override def apply(plan: LogicalPlan): LogicalPlan = plan resolveOperatorsDown {
// We only support temp variables for now and the system catalog is not properly implemented
// yet. We need to resolve `UnresolvedIdentifier` for variable commands specially.
- case c @ CreateVariable(UnresolvedIdentifier(nameParts, _), _, _) =>
- // From scripts we can only create local variables, which must be unqualified,
- // and must not be DECLARE OR REPLACE.
- val resolved = if (withinSqlScript) {
- if (c.replace) {
- throw new AnalysisException(
- "INVALID_VARIABLE_DECLARATION.REPLACE_LOCAL_VARIABLE",
- Map("varName" -> toSQLId(nameParts))
- )
- }
-
- if (nameParts.length != 1) {
- throw new AnalysisException(
- "INVALID_VARIABLE_DECLARATION.QUALIFIED_LOCAL_VARIABLE",
- Map("varName" -> toSQLId(nameParts)))
- }
-
- SqlScriptingContextManager.get().map(_.getVariableManager)
- .getOrElse(throw SparkException.internalError(
- "Scripting local variable manager should be present in SQL script."))
- .qualify(nameParts.last)
- } else {
- val resolvedIdentifier = catalogManager.tempVariableManager.qualify(nameParts.last)
-
- assertValidSessionVariableNameParts(nameParts, resolvedIdentifier)
- resolvedIdentifier
+ case c @ CreateVariable(identifiers, _, _) =>
+      // We resolve only UnresolvedIdentifiers and pass the other nodes through unchanged.
+ val resolved = identifiers.map {
+ case UnresolvedIdentifier(nameParts, _) =>
+ // From scripts we can only create local variables, which must be unqualified,
+ // and must not be DECLARE OR REPLACE.
+ if (withinSqlScript) {
+ if (c.replace) {
+ throw new AnalysisException(
+ "INVALID_VARIABLE_DECLARATION.REPLACE_LOCAL_VARIABLE",
+ Map("varName" -> toSQLId(nameParts))
+ )
+ }
+
+ if (nameParts.length != 1) {
+ throw new AnalysisException(
+ "INVALID_VARIABLE_DECLARATION.QUALIFIED_LOCAL_VARIABLE",
+ Map("varName" -> toSQLId(nameParts)))
+ }
+
+ SqlScriptingContextManager.get().map(_.getVariableManager)
+ .getOrElse(throw SparkException.internalError(
+ "Scripting local variable manager should be present in SQL script."))
+ .qualify(nameParts.last)
+ } else {
+          val resolvedIdentifier =
+            catalogManager.tempVariableManager.qualify(nameParts.last)
+
+ assertValidSessionVariableNameParts(nameParts, resolvedIdentifier)
+ resolvedIdentifier
+ }
+ case plan => plan
}
-
- c.copy(name = resolved)
+ c.copy(names = resolved)
case d @ DropVariable(UnresolvedIdentifier(nameParts, _), _) =>
if (withinSqlScript) {
throw new AnalysisException(
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataFrameDropColumns.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataFrameDropColumns.scala
index 0f9b93cc2986d..a0f67fa3f445f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataFrameDropColumns.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataFrameDropColumns.scala
@@ -17,8 +17,8 @@
package org.apache.spark.sql.catalyst.analysis
+import org.apache.spark.sql.catalyst.SQLConfHelper
import org.apache.spark.sql.catalyst.plans.logical.{DataFrameDropColumns, LogicalPlan, Project}
-import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.trees.TreePattern.DF_DROP_COLUMNS
import org.apache.spark.sql.connector.catalog.CatalogManager
@@ -27,17 +27,24 @@ import org.apache.spark.sql.connector.catalog.CatalogManager
* Note that DataFrameDropColumns allows and ignores non-existing columns.
*/
class ResolveDataFrameDropColumns(val catalogManager: CatalogManager)
- extends Rule[LogicalPlan] with ColumnResolutionHelper {
+ extends SQLConfHelper with ColumnResolutionHelper {
- override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsWithPruning(
+ def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsWithPruning(
_.containsPattern(DF_DROP_COLUMNS)) {
case d: DataFrameDropColumns if d.childrenResolved =>
// expressions in dropList can be unresolved, e.g.
// df.drop(col("non-existing-column"))
- val dropped = d.dropList.map {
+ val dropped = d.dropList.flatMap {
case u: UnresolvedAttribute =>
- resolveExpressionByPlanChildren(u, d)
- case e => e
+ if (u.getTagValue(LogicalPlan.PLAN_ID_TAG).nonEmpty) {
+            // The Plan Id comes from Spark Connect. Here we ignore the `UnresolvedAttribute`
+            // if its Plan Id can be found but the column itself cannot be resolved.
+ tryResolveColumnByPlanChildren(u, d)
+ } else {
+ Some(resolveExpressionByPlanChildren(u, d))
+ }
+ case e => Some(e)
}
val remaining = d.child.output.filterNot(attr => dropped.exists(_.semanticEquals(attr)))
if (remaining.size == d.child.output.size) {
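
A short, hedged illustration of the drop semantics preserved here, assuming a SparkSession named `spark`; dropping an unresolvable column remains a no-op whether or not the column carries a Connect plan id:

    import org.apache.spark.sql.functions.col

    val df = spark.range(3).withColumn("v", col("id") + 1)
    df.drop(col("does_not_exist")).columns   // Array("id", "v"): unknown columns are ignored
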
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveIdentifierClause.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveIdentifierClause.scala
index 96ed8a63585d0..7150c81ad64ec 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveIdentifierClause.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveIdentifierClause.scala
@@ -19,20 +19,18 @@ package org.apache.spark.sql.catalyst.analysis
import scala.collection.mutable
-import org.apache.spark.sql.catalyst.expressions.{AliasHelper, EvalHelper, Expression, SubqueryExpression, VariableReference}
-import org.apache.spark.sql.catalyst.parser.CatalystSqlParser
+import org.apache.spark.sql.catalyst.expressions.{Expression, SubqueryExpression, VariableReference}
import org.apache.spark.sql.catalyst.plans.logical.{CreateView, LogicalPlan}
import org.apache.spark.sql.catalyst.rules.{Rule, RuleExecutor}
import org.apache.spark.sql.catalyst.trees.TreePattern._
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.internal.SQLConf
-import org.apache.spark.sql.types.StringType
/**
* Resolves the identifier expressions and builds the original plans/expressions.
*/
class ResolveIdentifierClause(earlyBatches: Seq[RuleExecutor[LogicalPlan]#Batch])
- extends Rule[LogicalPlan] with AliasHelper with EvalHelper {
+ extends Rule[LogicalPlan] {
private val executor = new RuleExecutor[LogicalPlan] {
override def batches: Seq[Batch] = earlyBatches.asInstanceOf[Seq[Batch]]
@@ -70,7 +68,8 @@ class ResolveIdentifierClause(earlyBatches: Seq[RuleExecutor[LogicalPlan]#Batch]
referredTempVars.get ++= collectTemporaryVariablesInLogicalPlan(p)
}
- executor.execute(p.planBuilder.apply(evalIdentifierExpr(p.identifierExpr), p.children))
+ executor.execute(p.planBuilder.apply(
+ IdentifierResolution.evalIdentifierExpr(p.identifierExpr), p.children))
case other =>
other.transformExpressionsWithPruning(_.containsAnyPattern(UNRESOLVED_IDENTIFIER)) {
case e: ExpressionWithUnresolvedIdentifier if e.identifierExpr.resolved =>
@@ -79,7 +78,8 @@ class ResolveIdentifierClause(earlyBatches: Seq[RuleExecutor[LogicalPlan]#Batch]
referredTempVars.get ++= collectTemporaryVariablesInExpressionTree(e)
}
- e.exprBuilder.apply(evalIdentifierExpr(e.identifierExpr), e.otherExprs)
+ e.exprBuilder.apply(
+ IdentifierResolution.evalIdentifierExpr(e.identifierExpr), e.otherExprs)
}
}
@@ -104,31 +104,4 @@ class ResolveIdentifierClause(earlyBatches: Seq[RuleExecutor[LogicalPlan]#Batch]
}
collectTempVars(child)
}
-
- private def evalIdentifierExpr(expr: Expression): Seq[String] = {
- trimAliases(prepareForEval(expr)) match {
- case e if !e.foldable => expr.failAnalysis(
- errorClass = "NOT_A_CONSTANT_STRING.NOT_CONSTANT",
- messageParameters = Map(
- "name" -> "IDENTIFIER",
- "expr" -> expr.sql))
- case e if e.dataType != StringType => expr.failAnalysis(
- errorClass = "NOT_A_CONSTANT_STRING.WRONG_TYPE",
- messageParameters = Map(
- "name" -> "IDENTIFIER",
- "expr" -> expr.sql,
- "dataType" -> e.dataType.catalogString))
- case e =>
- e.eval() match {
- case null => expr.failAnalysis(
- errorClass = "NOT_A_CONSTANT_STRING.NULL",
- messageParameters = Map(
- "name" -> "IDENTIFIER",
- "expr" -> expr.sql))
- case other =>
- // Parse the identifier string to name parts.
- CatalystSqlParser.parseMultipartIdentifier(other.toString)
- }
- }
- }
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveInlineTables.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveInlineTables.scala
index 62f3997491c07..08cb70ddd5dba 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveInlineTables.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveInlineTables.scala
@@ -17,11 +17,11 @@
package org.apache.spark.sql.catalyst.analysis
-import org.apache.spark.sql.catalyst.EvaluateUnresolvedInlineTable
import org.apache.spark.sql.catalyst.expressions.EvalHelper
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.trees.AlwaysProcess
+import org.apache.spark.sql.catalyst.util.EvaluateUnresolvedInlineTable
/**
* An analyzer rule that replaces [[UnresolvedInlineTable]] with [[ResolvedInlineTable]].
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveLateralColumnAliasReference.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveLateralColumnAliasReference.scala
index 632d01f18ec2a..042e4483a37d3 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveLateralColumnAliasReference.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveLateralColumnAliasReference.scala
@@ -113,7 +113,7 @@ import org.apache.spark.sql.internal.SQLConf
* [[ExtractWindowExpressions]].
*/
// scalastyle:on line.size.limit
-object ResolveLateralColumnAliasReference extends Rule[LogicalPlan] {
+object ResolveLateralColumnAliasReference extends Rule[LogicalPlan] with AliasHelper {
case class AliasEntry(alias: Alias, index: Int)
private def assignAlias(expr: Expression): NamedExpression = {
@@ -170,7 +170,7 @@ object ResolveLateralColumnAliasReference extends Rule[LogicalPlan] {
UnresolvedAttribute(lcaRef.nameParts)
}.asInstanceOf[NamedExpression]
}
- val newProjectList = projectList.zipWithIndex.map {
+ val newProjectList = projectList.map(trimNonTopLevelAliases).zipWithIndex.map {
case (a: Alias, idx) =>
val lcaResolved = unwrapLCAReference(a)
// Insert the original alias instead of rewritten one to detect chained LCA
@@ -229,7 +229,9 @@ object ResolveLateralColumnAliasReference extends Rule[LogicalPlan] {
case e => e.children.forall(eligibleToLiftUp)
}
}
- if (!aggregateExpressions.forall(eligibleToLiftUp)) {
+ val aggregateExpressionsWithTrimmedAliases =
+ aggregateExpressions.map(trimNonTopLevelAliases)
+ if (!aggregateExpressionsWithTrimmedAliases.forall(eligibleToLiftUp)) {
agg
} else {
val newAggExprs = new LinkedHashSet[NamedExpression]
@@ -268,8 +270,9 @@ object ResolveLateralColumnAliasReference extends Rule[LogicalPlan] {
case e => e.mapChildren(extractExpressions)
}
}
- val projectExprs = aggregateExpressions.map(
- extractExpressions(_).asInstanceOf[NamedExpression])
+ val projectExprs = aggregateExpressionsWithTrimmedAliases.map(
+ extractExpressions(_).asInstanceOf[NamedExpression]
+ )
val newProject = Project(
projectList = projectExprs,
child = agg.copy(aggregateExpressions = newAggExprs.asScala.toSeq)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveMergeIntoSchemaEvolution.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveMergeIntoSchemaEvolution.scala
new file mode 100644
index 0000000000000..7e7776098a04a
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveMergeIntoSchemaEvolution.scala
@@ -0,0 +1,65 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis
+
+import org.apache.spark.sql.catalyst.plans.logical._
+import org.apache.spark.sql.catalyst.rules.Rule
+import org.apache.spark.sql.catalyst.types.DataTypeUtils
+import org.apache.spark.sql.connector.catalog.{CatalogV2Util, TableCatalog}
+import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
+import org.apache.spark.sql.errors.QueryCompilationErrors
+import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Relation
+
+
+/**
+ * A rule that resolves schema evolution for MERGE INTO.
+ *
+ * This rule will call the DSV2 Catalog to update the schema of the target table.
+ */
+object ResolveMergeIntoSchemaEvolution extends Rule[LogicalPlan] {
+
+ override def apply(plan: LogicalPlan): LogicalPlan = plan resolveOperators {
+ case m @ MergeIntoTable(_, _, _, _, _, _, _)
+ if m.needSchemaEvolution =>
+ val newTarget = m.targetTable.transform {
+ case r : DataSourceV2Relation => performSchemaEvolution(r, m.sourceTable)
+ }
+ m.copy(targetTable = newTarget)
+ }
+
+ private def performSchemaEvolution(relation: DataSourceV2Relation, source: LogicalPlan)
+ : DataSourceV2Relation = {
+ (relation.catalog, relation.identifier) match {
+ case (Some(c: TableCatalog), Some(i)) =>
+ val changes = MergeIntoTable.schemaChanges(relation.schema, source.schema)
+ c.alterTable(i, changes: _*)
+ val newTable = c.loadTable(i)
+ val newSchema = CatalogV2Util.v2ColumnsToStructType(newTable.columns())
+ // Check if there are any remaining changes not applied.
+ val remainingChanges = MergeIntoTable.schemaChanges(newSchema, source.schema)
+ if (remainingChanges.nonEmpty) {
+ throw QueryCompilationErrors.unsupportedTableChangesInAutoSchemaEvolutionError(
+ remainingChanges, i.toQualifiedNameParts(c))
+ }
+ relation.copy(table = newTable, output = DataTypeUtils.toAttributes(newSchema))
+ case _ => logWarning(s"Schema Evolution enabled but data source $relation " +
+ s"does not support it, skipping.")
+ relation
+ }
+ }
+}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveReferencesInSort.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveReferencesInSort.scala
index 6fa723d4a75fd..6e120ef015026 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveReferencesInSort.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveReferencesInSort.scala
@@ -20,53 +20,78 @@ import org.apache.spark.sql.catalyst.SQLConfHelper
import org.apache.spark.sql.catalyst.expressions.SortOrder
import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, LogicalPlan, Project, Sort}
import org.apache.spark.sql.connector.catalog.CatalogManager
+import org.apache.spark.sql.internal.SQLConf
/**
* A virtual rule to resolve [[UnresolvedAttribute]] in [[Sort]]. It's only used by the real
* rule `ResolveReferences`. The column resolution order for [[Sort]] is:
- * 1. Resolves the column to [[AttributeReference]] with the output of the child plan. This
+ * 1. Checks whether there are [[UnresolvedOrdinal]]s in the sort order list. If there are,
+ *    delay the resolution until all the ordinals are resolved. Without this check, we would
+ *    proceed to resolve the following query even though ordinal 2 is out of range of the
+ *    select list:
+ *    {{{ SELECT col1 FROM VALUES(1, 2) ORDER BY 2, col2; }}}
+ *    That's because we add the missing input in `ResolveReferencesInSort` to the underlying
+ *    operator and can then resolve the ordinal, since at that point the underlying operator
+ *    exposes two columns.
+ * 2. Resolves the column to [[AttributeReference]] with the output of the child plan. This
* includes metadata columns as well.
- * 2. Resolves the column to a literal function which is allowed to be invoked without braces, e.g.
+ * 3. Resolves the column to a literal function which is allowed to be invoked without braces, e.g.
* `SELECT col, current_date FROM t`.
- * 3. If the child plan is Aggregate or Filter(_, Aggregate), resolves the column to
+ * 4. If the child plan is Aggregate or Filter(_, Aggregate), resolves the column to
* [[TempResolvedColumn]] with the output of Aggregate's child plan.
* This is to allow Sort to host grouping expressions and aggregate functions, which can
* be pushed down to the Aggregate later. For example,
* `SELECT max(a) FROM t GROUP BY b HAVING max(a) > 1 ORDER BY min(a)`.
- * 4. Resolves the column to [[AttributeReference]] with the output of a descendant plan node.
+ * 5. Resolves the column to [[AttributeReference]] with the output of a descendant plan node.
* Spark will propagate the missing attributes from the descendant plan node to the Sort node.
* This is to allow users to ORDER BY columns that are not in the SELECT clause, which is
* widely supported in other SQL dialects. For example, `SELECT a FROM t ORDER BY b`.
- * 5. If the order by expressions only have one single unresolved column named ALL, expanded it to
+ * 6. If the order by expressions only have one single unresolved column named ALL, expanded it to
* include all columns in the SELECT list. This is to support SQL pattern like
* `SELECT col1, col2 FROM t ORDER BY ALL`. This should also support specifying asc/desc, and
* nulls first/last.
- * 6. Resolves the column to outer references with the outer plan if we are resolving subquery
+ * 7. Resolves the column to outer references with the outer plan if we are resolving subquery
* expressions.
*
- * Note, 3 and 4 are actually orthogonal. If the child plan is Aggregate, 4 can only resolve columns
- * as the grouping columns, which is completely covered by 3.
+ * Note, 4 and 5 are actually orthogonal. If the child plan is Aggregate, 5 can only resolve columns
+ * as the grouping columns, which is completely covered by 4.
*/
class ResolveReferencesInSort(val catalogManager: CatalogManager)
extends SQLConfHelper with ColumnResolutionHelper {
def apply(s: Sort): LogicalPlan = {
- val resolvedBasic = s.order.map(resolveExpressionByPlanOutput(_, s.child))
- val resolvedWithAgg = s.child match {
+ if (conf.getConf(SQLConf.PRIORITIZE_ORDINAL_RESOLUTION_IN_SORT) && hasUnresolvedOrdinals(s)) {
+ s
+ } else {
+ resolveReferencesInSort(s)
+ }
+ }
+
+ private def hasUnresolvedOrdinals(sort: Sort): Boolean = {
+ sort.order.exists { sortOrder =>
+ sortOrder.child match {
+ case _: UnresolvedOrdinal => true
+ case _ => false
+ }
+ }
+ }
+
+ private def resolveReferencesInSort(sort: Sort): LogicalPlan = {
+ val resolvedBasic = sort.order.map(resolveExpressionByPlanOutput(_, sort.child))
+ val resolvedWithAgg = sort.child match {
case Filter(_, agg: Aggregate) => resolvedBasic.map(resolveColWithAgg(_, agg))
- case _ => resolvedBasic.map(resolveColWithAgg(_, s.child))
+ case _ => resolvedBasic.map(resolveColWithAgg(_, sort.child))
}
- val (missingAttrResolved, newChild) = resolveExprsAndAddMissingAttrs(resolvedWithAgg, s.child)
+ val (missingAttrResolved, newChild) =
+ resolveExprsAndAddMissingAttrs(resolvedWithAgg, sort.child)
val orderByAllResolved = resolveOrderByAll(
- s.global, newChild, missingAttrResolved.map(_.asInstanceOf[SortOrder]))
+ sort.global, newChild, missingAttrResolved.map(_.asInstanceOf[SortOrder]))
val resolvedFinal = orderByAllResolved
.map(e => resolveColsLastResort(e).asInstanceOf[SortOrder])
- if (s.child.output == newChild.output) {
- s.copy(order = resolvedFinal)
+ if (sort.child.output == newChild.output) {
+ sort.copy(order = resolvedFinal)
} else {
// Add missing attributes and then project them away.
- val newSort = s.copy(order = resolvedFinal, child = newChild)
- Project(s.child.output, newSort)
+ val newSort = sort.copy(order = resolvedFinal, child = newChild)
+ Project(sort.child.output, newSort)
}
}
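
Hedged SQL-level illustrations of steps 5 and 6 from the scaladoc above, assuming a SparkSession named `spark`:

    // Step 5: ORDER BY a column that is not in the SELECT list.
    spark.sql("SELECT a FROM VALUES (1, 2) AS t(a, b) ORDER BY b")
    // Step 6: ORDER BY ALL expands to all columns of the SELECT list.
    spark.sql("SELECT a, b FROM VALUES (1, 2) AS t(a, b) ORDER BY ALL")
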
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveRowLevelCommandAssignments.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveRowLevelCommandAssignments.scala
index 3f3e707b054bb..83520b780f121 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveRowLevelCommandAssignments.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveRowLevelCommandAssignments.scala
@@ -48,7 +48,8 @@ object ResolveRowLevelCommandAssignments extends Rule[LogicalPlan] {
case u: UpdateTable if !u.skipSchemaResolution && u.resolved && !u.aligned =>
resolveAssignments(u)
- case m: MergeIntoTable if !m.skipSchemaResolution && m.resolved && m.rewritable && !m.aligned =>
+ case m: MergeIntoTable if !m.skipSchemaResolution && m.resolved && m.rewritable && !m.aligned &&
+ !m.needSchemaEvolution =>
validateStoreAssignmentPolicy()
m.copy(
targetTable = cleanAttrMetadata(m.targetTable),
@@ -56,7 +57,8 @@ object ResolveRowLevelCommandAssignments extends Rule[LogicalPlan] {
notMatchedActions = alignActions(m.targetTable.output, m.notMatchedActions),
notMatchedBySourceActions = alignActions(m.targetTable.output, m.notMatchedBySourceActions))
- case m: MergeIntoTable if !m.skipSchemaResolution && m.resolved && !m.aligned =>
+ case m: MergeIntoTable if !m.skipSchemaResolution && m.resolved && !m.aligned
+ && !m.needSchemaEvolution =>
resolveAssignments(m)
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSetVariable.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSetVariable.scala
index 24b6b04de514b..ab44084357670 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSetVariable.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSetVariable.scala
@@ -33,6 +33,7 @@ import org.apache.spark.sql.types.IntegerType
*/
class ResolveSetVariable(val catalogManager: CatalogManager) extends Rule[LogicalPlan]
with ColumnResolutionHelper {
+ private val variableResolution = new VariableResolution(catalogManager.tempVariableManager)
override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsWithPruning(
_.containsPattern(COMMAND), ruleId) {
@@ -40,7 +41,10 @@ class ResolveSetVariable(val catalogManager: CatalogManager) extends Rule[Logica
case setVariable: SetVariable if !setVariable.targetVariables.forall(_.resolved) =>
val resolvedVars = setVariable.targetVariables.map {
case u: UnresolvedAttribute =>
- lookupVariable(u.nameParts) match {
+ variableResolution.lookupVariable(
+ nameParts = u.nameParts,
+ resolvingExecuteImmediate = AnalysisContext.get.isExecuteImmediate
+ ) match {
case Some(variable) => variable.copy(canFold = false)
case _ => throw unresolvedVariableError(u.nameParts, Seq("SYSTEM", "SESSION"))
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveTableConstraints.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveTableConstraints.scala
index 3b86b9580ae19..41631b24a83ed 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveTableConstraints.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveTableConstraints.scala
@@ -19,17 +19,22 @@ package org.apache.spark.sql.catalyst.analysis
import scala.collection.mutable
import org.apache.spark.sql.catalyst.expressions.{And, CheckInvariant, Expression, V2ExpressionUtils}
-import org.apache.spark.sql.catalyst.plans.logical.{Filter, LogicalPlan, V2WriteCommand}
+import org.apache.spark.sql.catalyst.plans.logical.{Filter, LogicalPlan, V2WriteCommand, WriteDelta}
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.trees.TreePattern.COMMAND
import org.apache.spark.sql.connector.catalog.CatalogManager
import org.apache.spark.sql.connector.catalog.constraints.Check
+import org.apache.spark.sql.connector.write.RowLevelOperation
import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Relation
class ResolveTableConstraints(val catalogManager: CatalogManager) extends Rule[LogicalPlan] {
override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveOperatorsWithPruning(
_.containsPattern(COMMAND), ruleId) {
+    // Deleting a delta of rows from an existing table doesn't produce any new rows, so
+    // enforcing check constraints is unnecessary.
+ case w: WriteDelta if w.operation.command() == RowLevelOperation.Command.DELETE =>
+ w
case v2Write: V2WriteCommand
if v2Write.table.resolved && v2Write.query.resolved &&
!containsCheckInvariant(v2Write.query) && v2Write.outputResolved =>
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveWithCTE.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveWithCTE.scala
index 2a522e98a7683..0f6fcec467ce1 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveWithCTE.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveWithCTE.scala
@@ -59,6 +59,10 @@ object ResolveWithCTE extends Rule[LogicalPlan] {
cteDefMap.put(cteDef.id, cteDef)
}
cteDef
+ case cteDef if cteDef.hasSelfReferenceInAnchor || cteDef.hasSelfReferenceInSubCTE =>
+ throw new AnalysisException(
+ errorClass = "INVALID_RECURSIVE_CTE",
+ messageParameters = Map.empty)
case cteDef =>
// Multiple self-references are not allowed within one cteDef.
cteDef.child match {
@@ -306,7 +310,10 @@ object ResolveWithCTE extends Rule[LogicalPlan] {
columnNames: Option[Seq[String]]) = {
recursion.transformUpWithSubqueriesAndPruning(_.containsPattern(CTE)) {
case r: CTERelationRef if r.recursive && r.cteId == cteDefId =>
- val ref = UnionLoopRef(r.cteId, anchor.output.map(_.newInstance()), false)
+        // We mark the output of UnionLoopRef as nullable because it may become NULL in
+        // subsequent iterations.
+ val ref =
+ UnionLoopRef(r.cteId, anchor.output.map(_.newInstance().withNullability(true)), false)
columnNames.map(UnresolvedSubqueryColumnAliases(_, ref)).getOrElse(ref)
}
}
@@ -319,35 +326,42 @@ object ResolveWithCTE extends Rule[LogicalPlan] {
def checkIfSelfReferenceIsPlacedCorrectly(
plan: LogicalPlan,
cteId: Long,
- allowRecursiveRef: Boolean = true): Unit = plan match {
- case Join(left, right, Inner, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef)
- case Join(left, right, Cross, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef)
- case Join(left, right, LeftOuter, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
- case Join(left, right, RightOuter, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef = false)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef)
- case Join(left, right, LeftSemi, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
- case Join(left, right, LeftAnti, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
- case Join(left, right, _, _, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef = false)
- checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
- case Aggregate(_, _, child, _) =>
- checkIfSelfReferenceIsPlacedCorrectly(child, cteId, allowRecursiveRef = false)
- case r: UnionLoopRef if !allowRecursiveRef && r.loopId == cteId =>
- throw new AnalysisException(
- errorClass = "INVALID_RECURSIVE_REFERENCE.PLACE",
- messageParameters = Map.empty)
- case other =>
- other.children.foreach(checkIfSelfReferenceIsPlacedCorrectly(_, cteId, allowRecursiveRef))
+ allowRecursiveRef: Boolean = true): Unit = {
+ plan match {
+ case Join(left, right, Inner, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef)
+ case Join(left, right, Cross, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef)
+ case Join(left, right, LeftOuter, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
+ case Join(left, right, RightOuter, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef = false)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef)
+ case Join(left, right, LeftSemi, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
+ case Join(left, right, LeftAnti, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
+ case Join(left, right, _, _, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(left, cteId, allowRecursiveRef = false)
+ checkIfSelfReferenceIsPlacedCorrectly(right, cteId, allowRecursiveRef = false)
+ case Aggregate(_, _, child, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(child, cteId, allowRecursiveRef = false)
+ case Window(_, _, _, child, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(child, cteId, allowRecursiveRef = false)
+ case Sort(_, _, child, _) =>
+ checkIfSelfReferenceIsPlacedCorrectly(child, cteId, allowRecursiveRef = false)
+ case r: UnionLoopRef if !allowRecursiveRef && r.loopId == cteId =>
+ throw new AnalysisException(
+ errorClass = "INVALID_RECURSIVE_REFERENCE.PLACE",
+ messageParameters = Map.empty)
+ case other =>
+ other.children.foreach(checkIfSelfReferenceIsPlacedCorrectly(_, cteId, allowRecursiveRef))
+ }
+ plan.subqueries.foreach(checkIfSelfReferenceIsPlacedCorrectly(_, cteId, allowRecursiveRef))
}
}
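
A hedged SQL-level example of the placement check above, assuming a SparkSession named `spark` and the recursive CTE syntax this feature targets; a self-reference under an Aggregate (and now Window or Sort) in the recursive term is expected to fail with INVALID_RECURSIVE_REFERENCE.PLACE:

    spark.sql("""
      WITH RECURSIVE r(n) AS (
        SELECT 1
        UNION ALL
        SELECT max(n) + 1 FROM r WHERE n < 5  -- aggregate over the self-reference: not allowed
      )
      SELECT * FROM r
    """)
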
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/RewriteMergeIntoTable.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/RewriteMergeIntoTable.scala
index 7e2cf4f29807c..9e67aa156fa21 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/RewriteMergeIntoTable.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/RewriteMergeIntoTable.scala
@@ -23,7 +23,7 @@ import org.apache.spark.sql.catalyst.expressions.Literal.{FalseLiteral, TrueLite
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
import org.apache.spark.sql.catalyst.plans.{FullOuter, Inner, JoinType, LeftAnti, LeftOuter, RightOuter}
import org.apache.spark.sql.catalyst.plans.logical.{AppendData, DeleteAction, Filter, HintInfo, InsertAction, Join, JoinHint, LogicalPlan, MergeAction, MergeIntoTable, MergeRows, NO_BROADCAST_AND_REPLICATION, Project, ReplaceData, UpdateAction, WriteDelta}
-import org.apache.spark.sql.catalyst.plans.logical.MergeRows.{Discard, Instruction, Keep, ROW_ID, Split}
+import org.apache.spark.sql.catalyst.plans.logical.MergeRows.{Copy, Delete, Discard, Insert, Instruction, Keep, ROW_ID, Split, Update}
import org.apache.spark.sql.catalyst.util.RowDeltaUtils.{OPERATION_COLUMN, WRITE_OPERATION, WRITE_WITH_METADATA_OPERATION}
import org.apache.spark.sql.connector.catalog.SupportsRowLevelOperations
import org.apache.spark.sql.connector.write.{RowLevelOperationTable, SupportsDelta}
@@ -45,8 +45,8 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
override def apply(plan: LogicalPlan): LogicalPlan = plan resolveOperators {
case m @ MergeIntoTable(aliasedTable, source, cond, matchedActions, notMatchedActions,
- notMatchedBySourceActions, _) if m.resolved && m.rewritable && m.aligned &&
- matchedActions.isEmpty && notMatchedActions.size == 1 &&
+ notMatchedBySourceActions, _) if m.resolved && m.rewritable && m.aligned &&
+ !m.needSchemaEvolution && matchedActions.isEmpty && notMatchedActions.size == 1 &&
notMatchedBySourceActions.isEmpty =>
EliminateSubqueryAliases(aliasedTable) match {
@@ -79,7 +79,8 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
}
case m @ MergeIntoTable(aliasedTable, source, cond, matchedActions, notMatchedActions,
- notMatchedBySourceActions, _) if m.resolved && m.rewritable && m.aligned &&
+ notMatchedBySourceActions, _)
+ if m.resolved && m.rewritable && m.aligned && !m.needSchemaEvolution &&
matchedActions.isEmpty && notMatchedBySourceActions.isEmpty =>
EliminateSubqueryAliases(aliasedTable) match {
@@ -93,7 +94,7 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
val notMatchedInstructions = notMatchedActions.map {
case InsertAction(cond, assignments) =>
- Keep(cond.getOrElse(TrueLiteral), assignments.map(_.value))
+ Keep(Insert, cond.getOrElse(TrueLiteral), assignments.map(_.value))
case other =>
throw new AnalysisException(
errorClass = "_LEGACY_ERROR_TEMP_3053",
@@ -120,7 +121,8 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
}
case m @ MergeIntoTable(aliasedTable, source, cond, matchedActions, notMatchedActions,
- notMatchedBySourceActions, _) if m.resolved && m.rewritable && m.aligned =>
+ notMatchedBySourceActions, _)
+ if m.resolved && m.rewritable && m.aligned && !m.needSchemaEvolution =>
EliminateSubqueryAliases(aliasedTable) match {
case r @ DataSourceV2Relation(tbl: SupportsRowLevelOperations, _, _, _, _) =>
@@ -199,7 +201,7 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
// as the last MATCHED and NOT MATCHED BY SOURCE instruction
// this logic is specific to data sources that replace groups of data
val carryoverRowsOutput = Literal(WRITE_WITH_METADATA_OPERATION) +: targetTable.output
- val keepCarryoverRowsInstruction = Keep(TrueLiteral, carryoverRowsOutput)
+ val keepCarryoverRowsInstruction = Keep(Copy, TrueLiteral, carryoverRowsOutput)
val matchedInstructions = matchedActions.map { action =>
toInstruction(action, metadataAttrs)
@@ -436,7 +438,7 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
val rowValues = assignments.map(_.value)
val metadataValues = nullifyMetadataOnUpdate(metadataAttrs)
val output = Seq(Literal(WRITE_WITH_METADATA_OPERATION)) ++ rowValues ++ metadataValues
- Keep(cond.getOrElse(TrueLiteral), output)
+ Keep(Update, cond.getOrElse(TrueLiteral), output)
case DeleteAction(cond) =>
Discard(cond.getOrElse(TrueLiteral))
@@ -445,7 +447,7 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
val rowValues = assignments.map(_.value)
val metadataValues = metadataAttrs.map(attr => Literal(null, attr.dataType))
val output = Seq(Literal(WRITE_OPERATION)) ++ rowValues ++ metadataValues
- Keep(cond.getOrElse(TrueLiteral), output)
+ Keep(Insert, cond.getOrElse(TrueLiteral), output)
case other =>
throw new AnalysisException(
@@ -471,15 +473,15 @@ object RewriteMergeIntoTable extends RewriteRowLevelCommand with PredicateHelper
case UpdateAction(cond, assignments) =>
val output = deltaUpdateOutput(assignments, metadataAttrs, originalRowIdValues)
- Keep(cond.getOrElse(TrueLiteral), output)
+ Keep(Update, cond.getOrElse(TrueLiteral), output)
case DeleteAction(cond) =>
val output = deltaDeleteOutput(rowAttrs, rowIdAttrs, metadataAttrs, originalRowIdValues)
- Keep(cond.getOrElse(TrueLiteral), output)
+ Keep(Delete, cond.getOrElse(TrueLiteral), output)
case InsertAction(cond, assignments) =>
val output = deltaInsertOutput(assignments, metadataAttrs, originalRowIdValues)
- Keep(cond.getOrElse(TrueLiteral), output)
+ Keep(Insert, cond.getOrElse(TrueLiteral), output)
case other =>
throw new AnalysisException(
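The hunks above extend `MergeRows.Keep` so that each kept row also records which row-level operation produced it (`Copy`, `Update`, `Delete`, or `Insert`) instead of only carrying a condition and an output list. A minimal sketch of that shape, using simplified stand-in types (the names below are illustrative, not the Spark classes):

{{{
// Simplified stand-ins for the MergeRows instruction shape introduced above;
// these mirror the patch conceptually but are not the Spark classes.
object MergeInstructionSketch {
  sealed trait RowOp
  case object Copy extends RowOp
  case object Update extends RowOp
  case object Delete extends RowOp
  case object Insert extends RowOp

  // Keep now records *which* operation produced the row, in addition to the
  // condition and the output expressions (plain strings here for illustration).
  final case class Keep(op: RowOp, condition: String, output: Seq[String])

  def main(args: Array[String]): Unit = {
    // A matched UPDATE action with no explicit condition defaults to a true condition.
    val updateInstruction = Keep(Update, "true", Seq("col1_new", "col2_new"))
    // Carry-over rows for group-replacing data sources are tagged as Copy.
    val carryover = Keep(Copy, "true", Seq("col1", "col2"))
    println(Seq(updateInstruction, carryover).mkString("\n"))
  }
}
}}}

Tagging the instruction with its operation kind lets later planning distinguish carried-over rows from rewritten ones without re-deriving that information from the output expressions.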
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/StreamingJoinHelper.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/StreamingJoinHelper.scala
index ef425be42f981..c4549a189e8e1 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/StreamingJoinHelper.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/StreamingJoinHelper.scala
@@ -21,7 +21,6 @@ import scala.util.control.NonFatal
import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.planning.ExtractEquiJoinKeys
import org.apache.spark.sql.catalyst.plans.logical.{EventTimeWatermark, LogicalPlan}
@@ -239,7 +238,7 @@ object StreamingJoinHelper extends PredicateHelper with Logging {
collect(left, negate) ++ collect(right, negate)
case Subtract(left, right, _) =>
collect(left, negate) ++ collect(right, !negate)
- case TimeAdd(left, right, _) =>
+ case TimestampAddInterval(left, right, _) =>
collect(left, negate) ++ collect(right, negate)
case DatetimeSub(_, _, child) => collect(child, negate)
case UnaryMinus(child, _) =>
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TableOutputResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TableOutputResolver.scala
index adf74c489ce1f..5243e17afe5da 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TableOutputResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TableOutputResolver.scala
@@ -132,7 +132,11 @@ object TableOutputResolver extends SQLConfHelper with Logging {
case (valueType, colType) if DataType.equalsIgnoreCompatibleNullability(valueType, colType) =>
val canWriteExpr = canWrite(
tableName, valueType, colType, byName = true, conf, addError, colPath)
- if (canWriteExpr) checkNullability(value, col, conf, colPath) else value
+ if (canWriteExpr) {
+ applyColumnMetadata(checkNullability(value, col, conf, colPath), col)
+ } else {
+ value
+ }
case (valueType: StructType, colType: StructType) =>
val resolvedValue = resolveStructType(
tableName, value, valueType, col, colType,
@@ -180,12 +184,67 @@ object TableOutputResolver extends SQLConfHelper with Logging {
} else {
CharVarcharUtils.stringLengthCheck(casted, attr.dataType)
}
- Alias(exprWithStrLenCheck, attr.name)(explicitMetadata = Some(attr.metadata))
+ applyColumnMetadata(exprWithStrLenCheck, attr)
} else {
value
}
}
+
+ /**
+ * Add an [[Alias]] with the name and metadata from the given target table attribute.
+ *
+ * The metadata may be used by writers to get certain table properties.
+ * For example, [[org.apache.spark.sql.catalyst.json.JacksonGenerator]]
+ * looks for default value metadata to control some of its behavior.
+ * This is not an ideal design, but it is the current behavior.
+ * We should change all the writers to pick up table configuration
+ * from the table directly. However, there are many third-party
+ * connectors that may rely on this behavior.
+ *
+ * We must also remove any [[CharVarcharUtils.CHAR_VARCHAR_TYPE_STRING_METADATA_KEY]]
+ * metadata so that it does not flow out the top of the query.
+ * If we don't, the write operation will remain unresolved or, worse,
+ * it may flip from resolved to unresolved. We assume that the read-side
+ * handling is performed lower in the query.
+ *
+ * Moreover, we cannot propagate other source metadata, such as source table
+ * default value definitions, without confusing writers with reader metadata.
+ * So we need to make sure that source metadata is blocked from propagating.
+ *
+ * See SPARK-52772 for a discussion on rewrites that caused trouble with
+ * going from resolved to unresolved.
+ */
+ private def applyColumnMetadata(expr: Expression, column: Attribute): NamedExpression = {
+ // We have dealt with the required write-side char/varchar processing.
+ // We do not want to transfer that information to the read side.
+ // If we do, the write operation will fail to resolve.
+ val requiredMetadata = CharVarcharUtils.cleanMetadata(column.metadata)
+
+ // Make sure that the result has the requiredMetadata and only that.
+ // If the expr is an Attribute or NamedLambdaVariable with the proper name and metadata,
+ // it should remain stable, but we do not trust that other NamedAttributes will
+ // remain stable (namely Alias).
+ expr match {
+ case a: Attribute if a.name == column.name && a.metadata == requiredMetadata =>
+ a
+ case v: NamedLambdaVariable if v.name == column.name && v.metadata == requiredMetadata =>
+ v
+ case _ =>
+ // We cannot keep an Alias with the correct name and metadata because the
+ // metadata might be derived, and derived metadata is not stable upon rewrites.
+ // For example:
+ // Alias(cast(attr, attr.dataType), n).metadata is empty, whereas
+ // Alias(attr, n).metadata == attr.metadata.
+ val stripAlias = expr match {
+ case a: Alias => a.child
+ case _ => expr
+ }
+ Alias(stripAlias, column.name)(explicitMetadata = Some(requiredMetadata))
+ }
+ }
+
+
private def canWrite(
tableName: String,
valueType: DataType,
@@ -227,20 +286,14 @@ object TableOutputResolver extends SQLConfHelper with Logging {
tableName, newColPath.quoted
)
}
- defaultExpr
+ Some(applyColumnMetadata(defaultExpr.get, expectedCol))
} else if (matched.length > 1) {
throw QueryCompilationErrors.incompatibleDataToTableAmbiguousColumnNameError(
tableName, newColPath.quoted
)
} else {
matchedCols += matched.head.name
- val expectedName = expectedCol.name
- val matchedCol = matched.head match {
- // Save an Alias if we can change the name directly.
- case a: Attribute => a.withName(expectedName)
- case a: Alias => a.withName(expectedName)
- case other => other
- }
+ val matchedCol = matched.head
val actualExpectedCol = expectedCol.withDataType {
CharVarcharUtils.getRawType(expectedCol.metadata).getOrElse(expectedCol.dataType)
}
@@ -386,7 +439,7 @@ object TableOutputResolver extends SQLConfHelper with Logging {
} else {
struct
}
- Some(Alias(res, expected.name)())
+ Some(applyColumnMetadata(res, expected))
} else {
None
}
@@ -412,16 +465,15 @@ object TableOutputResolver extends SQLConfHelper with Logging {
resolveColumnsByPosition(tableName, Seq(param), Seq(fakeAttr), conf, addError, colPath)
}
if (res.length == 1) {
- if (res.head == param) {
- // If the element type is the same, we can reuse the input array directly.
- Some(
- Alias(nullCheckedInput, expected.name)(
- nonInheritableMetadataKeys =
- Seq(CharVarcharUtils.CHAR_VARCHAR_TYPE_STRING_METADATA_KEY)))
- } else {
- val func = LambdaFunction(res.head, Seq(param))
- Some(Alias(ArrayTransform(nullCheckedInput, func), expected.name)())
- }
+ val castedArray =
+ if (res.head == param) {
+ // If the element type is the same, we can reuse the input array directly.
+ nullCheckedInput
+ } else {
+ val func = LambdaFunction(res.head, Seq(param))
+ ArrayTransform(nullCheckedInput, func)
+ }
+ Some(applyColumnMetadata(castedArray, expected))
} else {
None
}
@@ -461,26 +513,25 @@ object TableOutputResolver extends SQLConfHelper with Logging {
if (resKey.length == 1 && resValue.length == 1) {
// If the key and value expressions have not changed, we just check original map field.
// Otherwise, we construct a new map by adding transformations to the keys and values.
- if (resKey.head == keyParam && resValue.head == valueParam) {
- Some(
- Alias(nullCheckedInput, expected.name)(
- nonInheritableMetadataKeys =
- Seq(CharVarcharUtils.CHAR_VARCHAR_TYPE_STRING_METADATA_KEY)))
- } else {
- val newKeys = if (resKey.head != keyParam) {
- val keyFunc = LambdaFunction(resKey.head, Seq(keyParam))
- ArrayTransform(MapKeys(nullCheckedInput), keyFunc)
- } else {
- MapKeys(nullCheckedInput)
- }
- val newValues = if (resValue.head != valueParam) {
- val valueFunc = LambdaFunction(resValue.head, Seq(valueParam))
- ArrayTransform(MapValues(nullCheckedInput), valueFunc)
+ val casted =
+ if (resKey.head == keyParam && resValue.head == valueParam) {
+ nullCheckedInput
} else {
- MapValues(nullCheckedInput)
+ val newKeys = if (resKey.head != keyParam) {
+ val keyFunc = LambdaFunction(resKey.head, Seq(keyParam))
+ ArrayTransform(MapKeys(nullCheckedInput), keyFunc)
+ } else {
+ MapKeys(nullCheckedInput)
+ }
+ val newValues = if (resValue.head != valueParam) {
+ val valueFunc = LambdaFunction(resValue.head, Seq(valueParam))
+ ArrayTransform(MapValues(nullCheckedInput), valueFunc)
+ } else {
+ MapValues(nullCheckedInput)
+ }
+ MapFromArrays(newKeys, newValues)
}
- Some(Alias(MapFromArrays(newKeys, newValues), expected.name)())
- }
+ Some(applyColumnMetadata(casted, expected))
} else {
None
}
@@ -525,12 +576,6 @@ object TableOutputResolver extends SQLConfHelper with Logging {
!Cast.canUpCast(cast.child.dataType, cast.dataType)
}
- private def isCompatible(tableAttr: Attribute, queryExpr: NamedExpression): Boolean = {
- DataTypeUtils.sameType(tableAttr.dataType, queryExpr.dataType) &&
- tableAttr.name == queryExpr.name &&
- tableAttr.metadata == queryExpr.metadata
- }
-
private def checkField(
tableName: String,
tableAttr: Attribute,
@@ -546,33 +591,32 @@ object TableOutputResolver extends SQLConfHelper with Logging {
} else {
tableAttr.dataType
}
- lazy val outputField = if (isCompatible(tableAttr, queryExpr)) {
- if (requiresNullChecks(queryExpr, tableAttr, conf)) {
- val assert = AssertNotNull(queryExpr, colPath)
- Some(Alias(assert, tableAttr.name)(explicitMetadata = Some(tableAttr.metadata)))
- } else {
- Some(queryExpr)
- }
- } else {
- val nullCheckedQueryExpr = checkNullability(queryExpr, tableAttr, conf, colPath)
- val udtUnwrapped = unwrapUDT(nullCheckedQueryExpr)
- val casted = cast(udtUnwrapped, attrTypeWithoutCharVarchar, conf, colPath.quoted)
- val exprWithStrLenCheck = if (conf.charVarcharAsString || !attrTypeHasCharVarchar) {
- casted
- } else {
- CharVarcharUtils.stringLengthCheck(casted, tableAttr.dataType)
- }
- // Renaming is needed for handling the following cases like
- // 1) Column names/types do not match, e.g., INSERT INTO TABLE tab1 SELECT 1, 2
- // 2) Target tables have column metadata
- Some(Alias(exprWithStrLenCheck, tableAttr.name)(explicitMetadata = Some(tableAttr.metadata)))
- }
val canWriteExpr = canWrite(
tableName, queryExpr.dataType, attrTypeWithoutCharVarchar,
byName, conf, addError, colPath)
- if (canWriteExpr) outputField else None
+ if (canWriteExpr) {
+ val prepared =
+ if (DataTypeUtils.sameType(tableAttr.dataType, queryExpr.dataType)) {
+ // If the types are an exact match, we can leave UDTs alone,
+ // we obviously do not need a cast, and the constraints of the target
+ // table char/varchar types must be met.
+ queryExpr
+ } else {
+ val udtUnwrapped = unwrapUDT(queryExpr)
+ val casted = cast(udtUnwrapped, attrTypeWithoutCharVarchar, conf, colPath.quoted)
+ if (conf.charVarcharAsString || !attrTypeHasCharVarchar) {
+ casted
+ } else {
+ CharVarcharUtils.stringLengthCheck(casted, tableAttr.dataType)
+ }
+ }
+ val nullChecked = checkNullability(prepared, tableAttr, conf, colPath)
+ Some(applyColumnMetadata(nullChecked, tableAttr))
+ } else {
+ None
+ }
}
private def unwrapUDT(expr: Expression): Expression = expr.dataType match {
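The new `applyColumnMetadata` helper above centralizes a pattern the previous code repeated across several branches: re-alias the written expression with the target column's name and its cleaned metadata, and never let query-side metadata or write-side char/varchar bookkeeping leak out of the top of the query. A toy model of that idea, with plain string maps standing in for Spark's `Metadata` (the key name below is hypothetical):

{{{
// Toy model of the applyColumnMetadata idea: the output column always takes
// the target column's name and *cleaned* target metadata, never the metadata
// derived from the query side.
object ApplyColumnMetadataSketch {
  final case class Column(name: String, metadata: Map[String, String])
  final case class NamedValue(name: String, metadata: Map[String, String], sql: String)

  // Hypothetical key standing in for CharVarcharUtils.CHAR_VARCHAR_TYPE_STRING_METADATA_KEY.
  private val CharVarcharKey = "__CHAR_VARCHAR_TYPE_STRING"

  def applyColumnMetadata(value: NamedValue, column: Column): NamedValue = {
    // Drop write-side char/varchar bookkeeping so it does not leak to the read side.
    val required = column.metadata - CharVarcharKey
    if (value.name == column.name && value.metadata == required) {
      value // Already stable: correct name and exactly the required metadata.
    } else {
      value.copy(name = column.name, metadata = required)
    }
  }

  def main(args: Array[String]): Unit = {
    val target = Column("c", Map("default" -> "42", CharVarcharKey -> "varchar(10)"))
    val query = NamedValue("c_src", Map("comment" -> "from source"), "cast(c_src as string)")
    // The result carries the target name and only the cleaned target metadata.
    println(applyColumnMetadata(query, target))
  }
}
}}}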
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionBase.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionBase.scala
index a8832aada0839..271e151e709cc 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionBase.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionBase.scala
@@ -42,6 +42,7 @@ import org.apache.spark.sql.catalyst.plans.logical.{
Project,
ReplaceTable,
Union,
+ UnionLoop,
Unpivot
}
import org.apache.spark.sql.catalyst.rules.Rule
@@ -49,6 +50,7 @@ import org.apache.spark.sql.catalyst.trees.CurrentOrigin.withOrigin
import org.apache.spark.sql.catalyst.util.ResolveDefaultColumns
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.MultipartIdentifierHelper
import org.apache.spark.sql.connector.catalog.procedures.BoundProcedure
+import org.apache.spark.sql.errors.DataTypeErrors.cannotMergeIncompatibleDataTypesError
import org.apache.spark.sql.types.DataType
abstract class TypeCoercionBase extends TypeCoercionHelper {
@@ -247,6 +249,25 @@ abstract class TypeCoercionBase extends TypeCoercionHelper {
val attrMapping = s.children.head.output.zip(newChildren.head.output)
s.copy(children = newChildren) -> attrMapping
}
+
+ case s: UnionLoop
+ if s.childrenResolved && s.anchor.output.length == s.recursion.output.length
+ && !s.resolved =>
+ // If the anchor data type is wider than the recursion data type, we cast the recursion
+ // type to match the anchor type.
+ // On the other hand, we cannot cast the anchor type into a wider recursion type, as at
+ // this point the UnionLoopRefs inside the recursion are already resolved with the
+ // narrower anchor type.
+ val projectList = s.recursion.output.zip(s.anchor.output.map(_.dataType)).map {
+ case (attr, dt) =>
+ val widerType = findWiderTypeForTwo(attr.dataType, dt)
+ if (widerType.isDefined && widerType.get == dt) {
+ Alias(Cast(attr, dt), attr.name)()
+ } else {
+ throw cannotMergeIncompatibleDataTypesError(dt, attr.dataType)
+ }
+ }
+ s.copy(recursion = Project(projectList, s.recursion)) -> Nil
}
}
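The new `UnionLoop` branch above only ever casts the recursion side toward the anchor's types; when the anchor type is not the wider of the two, resolution fails, because the `UnionLoopRef`s inside the recursion are already bound to the anchor's (narrower) types. A small sketch of that decision, with a toy widening function standing in for `findWiderTypeForTwo`:

{{{
// Toy version of the UnionLoop coercion decision: only recursion -> anchor
// casts are allowed, because the recursion is already resolved with the
// anchor's output types.
object UnionLoopCoercionSketch {
  sealed trait DType
  case object IntT extends DType
  case object LongT extends DType
  case object StringT extends DType

  // Stand-in for findWiderTypeForTwo; real widening rules are much richer.
  def wider(a: DType, b: DType): Option[DType] = (a, b) match {
    case (x, y) if x == y => Some(x)
    case (IntT, LongT) | (LongT, IntT) => Some(LongT)
    case _ => None
  }

  /** Returns Right(needsCast) if allowed, or Left(error message) otherwise. */
  def planRecursionCast(recursionType: DType, anchorType: DType): Either[String, Boolean] =
    wider(recursionType, anchorType) match {
      case Some(w) if w == anchorType => Right(recursionType != anchorType)
      case _ => Left(s"cannot merge $anchorType with $recursionType")
    }

  def main(args: Array[String]): Unit = {
    println(planRecursionCast(IntT, LongT))      // Right(true): cast recursion to LONG
    println(planRecursionCast(LongT, IntT))      // Left(...): anchor is narrower, not allowed
    println(planRecursionCast(StringT, StringT)) // Right(false): no cast needed
  }
}
}}}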
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionHelper.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionHelper.scala
index 390ff2f3114d9..0e7d44e98bfb8 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionHelper.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/TypeCoercionHelper.scala
@@ -51,7 +51,7 @@ import org.apache.spark.sql.catalyst.expressions.{
SpecialFrameBoundary,
SpecifiedWindowFrame,
SubtractTimestamps,
- TimeAdd,
+ TimestampAddInterval,
WindowSpecDefinition
}
import org.apache.spark.sql.catalyst.expressions.aggregate.{Average, Sum}
@@ -671,7 +671,7 @@ abstract class TypeCoercionHelper {
case (e, _: DateType) => e
case (e, _: TimestampType) => e
case (e: Expression, t) if e.dataType != t && canCast(e.dataType, t) =>
- Cast(e, t)
+ Cast(child = e, dataType = t).withTimeZone(conf.sessionLocalTimeZone)
case _ => boundary
}
}
@@ -700,7 +700,8 @@ abstract class TypeCoercionHelper {
val newRight = castIfNotSameType(s.right, TimestampNTZType)
s.copy(left = newLeft, right = newRight)
- case t @ TimeAdd(StringTypeExpression(), _, _) => t.copy(start = Cast(t.start, TimestampType))
+ case t @ TimestampAddInterval(StringTypeExpression(), _, _) =>
+ t.copy(start = Cast(t.start, TimestampType))
case other => other
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/UnsupportedOperationChecker.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/UnsupportedOperationChecker.scala
index 55b5b8ddfe6a3..fd4e081c91b52 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/UnsupportedOperationChecker.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/UnsupportedOperationChecker.scala
@@ -19,7 +19,7 @@ package org.apache.spark.sql.catalyst.analysis
import java.util.Locale
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{ANALYSIS_ERROR, QUERY_PLAN}
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.ExtendedAnalysisException
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ValidateSubqueryExpression.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ValidateSubqueryExpression.scala
index 4e35bd313d370..f88e2d112b558 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ValidateSubqueryExpression.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ValidateSubqueryExpression.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.catalyst.analysis
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.SubExprUtils._
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/VariableResolution.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/VariableResolution.scala
new file mode 100644
index 0000000000000..72af7c619a083
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/VariableResolution.scala
@@ -0,0 +1,186 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis
+
+import java.util.Locale
+
+import org.apache.spark.sql.catalyst.{SQLConfHelper, SqlScriptingContextManager}
+import org.apache.spark.sql.catalyst.catalog.TempVariableManager
+import org.apache.spark.sql.catalyst.expressions.{
+ Expression,
+ ExtractValue,
+ Literal,
+ VariableReference
+}
+import org.apache.spark.sql.catalyst.parser.SqlScriptingLabelContext.isForbiddenLabelOrForVariableName
+import org.apache.spark.sql.connector.catalog.{
+ CatalogManager,
+ Identifier
+}
+
+class VariableResolution(tempVariableManager: TempVariableManager) extends SQLConfHelper {
+
+ /**
+ * Resolves a multipart name (`nameParts`) to an [[Expression]] tree, supporting nested field
+ * access.
+ *
+ * This method implements a longest-match strategy similar to column resolution,
+ * preferring fully qualified variable names to avoid naming conflicts. It supports
+ * accessing nested fields within variables through dot notation.
+ *
+ * The resolution process works as follows:
+ * 1. Attempts to resolve the full name as a variable
+ * 2. If unsuccessful, treats the rightmost parts as nested field access
+ * 3. Continues until a variable is found or all combinations are exhausted
+ * 4. Wraps the result in ExtractValue expressions for nested field access
+ *
+ * @param nameParts The sequence of name parts representing the variable identifier
+ * (e.g., ["catalog", "schema", "variable", "field1", "field2"])
+ * @param resolvingView Whether this resolution is happening within a view context.
+ * When true, only variables explicitly referred to in the view definition are accessible.
+ * @param resolvingExecuteImmediate Whether this resolution is happening within an
+ * EXECUTE IMMEDIATE context. When true, local variables are not accessible, only session
+ * variables.
+ * @param referredTempVariableNames When resolving within a view, this contains the list of
+ * variable names that the view explicitly references and should have access to.
+ *
+ * @return Some(Expression) if a variable is successfully resolved, potentially wrapped in
+ * [[ExtractValue]] expressions for nested field access. None if no variable can be resolved
+ * from the given name parts.
+ */
+ def resolveMultipartName(
+ nameParts: Seq[String],
+ resolvingView: Boolean,
+ resolvingExecuteImmediate: Boolean,
+ referredTempVariableNames: Seq[Seq[String]]): Option[Expression] = {
+ var resolvedVariable: Option[Expression] = None
+ // We only support temp variables for now, so the variable name can have at most 3 parts.
+ var numInnerFields: Int = math.max(0, nameParts.length - 3)
+ // Follow the column resolution and prefer the longest match. This makes sure that users
+ // can always use fully qualified variable name to avoid name conflicts.
+ while (resolvedVariable.isEmpty && numInnerFields < nameParts.length) {
+ resolvedVariable = resolveVariable(
+ nameParts = nameParts.dropRight(numInnerFields),
+ resolvingView = resolvingView,
+ resolvingExecuteImmediate = resolvingExecuteImmediate,
+ referredTempVariableNames = referredTempVariableNames
+ )
+
+ if (resolvedVariable.isEmpty) {
+ numInnerFields += 1
+ }
+ }
+
+ resolvedVariable.map { variable =>
+ if (numInnerFields != 0) {
+ val nestedFields = nameParts.takeRight(numInnerFields)
+ nestedFields.foldLeft(variable: Expression) { (e, name) =>
+ ExtractValue(e, Literal(name), conf.resolver)
+ }
+ } else {
+ variable
+ }
+ }
+ }
+
+ /**
+ * Looks up a variable by its name parts.
+ * If in a SQL script, local variables are checked first, unless in EXECUTE IMMEDIATE
+ * (a query generated by EXECUTE IMMEDIATE cannot access local variables).
+ * If the variable is not found there, fall back to session variables.
+ * @param nameParts NameParts of the variable.
+ * @param resolvingExecuteImmediate Whether the current context is in EXECUTE IMMEDIATE.
+ * @return Reference to the variable.
+ */
+ def lookupVariable(
+ nameParts: Seq[String],
+ resolvingExecuteImmediate: Boolean): Option[VariableReference] = {
+ val namePartsCaseAdjusted = if (conf.caseSensitiveAnalysis) {
+ nameParts
+ } else {
+ nameParts.map(_.toLowerCase(Locale.ROOT))
+ }
+
+ SqlScriptingContextManager
+ .get()
+ .map(_.getVariableManager)
+ // If we are in EXECUTE IMMEDIATE lookup only session variables.
+ .filterNot(_ => resolvingExecuteImmediate)
+ // If the variable name is qualified with `session.`, treat it as a session variable.
+ .filterNot(
+ _ =>
+ nameParts.length > 2
+ || (nameParts.length == 2 && isForbiddenLabelOrForVariableName(nameParts.head))
+ )
+ .flatMap(_.get(namePartsCaseAdjusted))
+ .map { varDef =>
+ VariableReference(
+ nameParts,
+ FakeLocalCatalog,
+ Identifier.of(Array(varDef.identifier.namespace().last), namePartsCaseAdjusted.last),
+ varDef
+ )
+ }
+ .orElse(
+ if (maybeTempVariableName(nameParts)) {
+ tempVariableManager
+ .get(namePartsCaseAdjusted)
+ .map { varDef =>
+ VariableReference(
+ nameParts,
+ FakeSystemCatalog,
+ Identifier.of(Array(CatalogManager.SESSION_NAMESPACE), namePartsCaseAdjusted.last),
+ varDef
+ )
+ }
+ } else {
+ None
+ }
+ )
+ }
+
+ private def resolveVariable(
+ nameParts: Seq[String],
+ resolvingView: Boolean,
+ resolvingExecuteImmediate: Boolean,
+ referredTempVariableNames: Seq[Seq[String]]): Option[Expression] = {
+ if (resolvingView) {
+ if (referredTempVariableNames.contains(nameParts)) {
+ lookupVariable(nameParts = nameParts, resolvingExecuteImmediate = resolvingExecuteImmediate)
+ } else {
+ None
+ }
+ } else {
+ lookupVariable(nameParts = nameParts, resolvingExecuteImmediate = resolvingExecuteImmediate)
+ }
+ }
+
+ // The temp variables live in `SYSTEM.SESSION`, and the name can be qualified or not.
+ private def maybeTempVariableName(nameParts: Seq[String]): Boolean = {
+ nameParts.length == 1 || {
+ if (nameParts.length == 2) {
+ nameParts.head.equalsIgnoreCase(CatalogManager.SESSION_NAMESPACE)
+ } else if (nameParts.length == 3) {
+ nameParts(0).equalsIgnoreCase(CatalogManager.SYSTEM_CATALOG_NAME) &&
+ nameParts(1).equalsIgnoreCase(CatalogManager.SESSION_NAMESPACE)
+ } else {
+ false
+ }
+ }
+ }
+
+}
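`resolveMultipartName` above follows the same longest-match rule as column resolution: first try the full multipart name as a variable, then progressively peel trailing parts off as nested field accesses. A simplified model of just that loop, assuming a fixed set of known variable names (the types and lookup are illustrative, not Spark's):

{{{
// Simplified model of the longest-match loop in resolveMultipartName: prefer
// the longest prefix that names a variable; remaining parts are nested fields.
object VariableNameMatchSketch {
  def resolve(
      nameParts: Seq[String],
      knownVariables: Set[Seq[String]]): Option[(Seq[String], Seq[String])] = {
    // Variables have at most 3 name parts (system.session.name), so anything
    // longer must include nested fields.
    var innerFields = math.max(0, nameParts.length - 3)
    while (innerFields < nameParts.length) {
      val candidate = nameParts.dropRight(innerFields)
      if (knownVariables.contains(candidate.map(_.toLowerCase))) {
        return Some((candidate, nameParts.takeRight(innerFields)))
      }
      innerFields += 1
    }
    None
  }

  def main(args: Array[String]): Unit = {
    val vars = Set(Seq("system", "session", "v"), Seq("v"))
    // A full match wins: no nested fields.
    println(resolve(Seq("system", "session", "v"), vars))
    // Trailing parts become nested field accesses on the resolved variable.
    println(resolve(Seq("v", "f1", "f2"), vars))
  }
}
}}}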
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ViewResolution.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ViewResolution.scala
index 371be97bebc0e..faa3b9081cbfd 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ViewResolution.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/ViewResolution.scala
@@ -43,7 +43,13 @@ object ViewResolution {
view
)
}
- SQLConf.withExistingConf(View.effectiveSQLConf(view.desc.viewSQLConfigs, view.isTempView)) {
+ SQLConf.withExistingConf(
+ View.effectiveSQLConf(
+ configs = view.desc.viewSQLConfigs,
+ isTempView = view.isTempView,
+ createSparkVersion = view.desc.createVersion
+ )
+ ) {
resolveChild(view.child)
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/WindowResolution.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/WindowResolution.scala
new file mode 100644
index 0000000000000..a477fe4398f65
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/WindowResolution.scala
@@ -0,0 +1,174 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis
+
+import org.apache.spark.sql.catalyst.expressions.{
+ AggregateWindowFunction,
+ CurrentRow,
+ FrameLessOffsetWindowFunction,
+ RangeFrame,
+ RankLike,
+ RowFrame,
+ SpecifiedWindowFrame,
+ UnboundedFollowing,
+ UnboundedPreceding,
+ UnspecifiedFrame,
+ WindowExpression,
+ WindowFunction,
+ WindowSpecDefinition
+}
+import org.apache.spark.sql.catalyst.expressions.aggregate.{
+ AggregateExpression,
+ ListAgg,
+ Median,
+ PercentileCont,
+ PercentileDisc
+}
+import org.apache.spark.sql.catalyst.util.TypeUtils.toSQLExpr
+import org.apache.spark.sql.errors.QueryCompilationErrors
+
+/**
+ * Utility object for resolving [[WindowExpression]].
+ *
+ * It ensures that window frame definitions and order specs are consistent between the
+ * [[WindowFunction]] and [[WindowSpecDefinition]], throwing errors if configurations are
+ * incompatible or missing.
+ */
+object WindowResolution {
+
+ /**
+ * Validates the window frame of a [[WindowExpression]].
+ *
+ * It enforces that the frame in [[WindowExpression.windowFunction]] matches the frame
+ * in [[WindowExpression.windowSpec]]; alternatively, it provides a default frame when it
+ * is unspecified.
+ */
+ def resolveFrame(windowExpression: WindowExpression): WindowExpression = windowExpression match {
+ case WindowExpression(
+ wf: FrameLessOffsetWindowFunction,
+ WindowSpecDefinition(_, _, f: SpecifiedWindowFrame)
+ ) if wf.frame != f =>
+ throw QueryCompilationErrors.cannotSpecifyWindowFrameError(wf.prettyName)
+
+ case WindowExpression(wf: WindowFunction, WindowSpecDefinition(_, _, f: SpecifiedWindowFrame))
+ if wf.frame != UnspecifiedFrame && wf.frame != f =>
+ throw QueryCompilationErrors.windowFrameNotMatchRequiredFrameError(f, wf.frame)
+
+ case WindowExpression(wf: WindowFunction, s @ WindowSpecDefinition(_, _, UnspecifiedFrame))
+ if wf.frame != UnspecifiedFrame =>
+ WindowExpression(wf, s.copy(frameSpecification = wf.frame))
+
+ case we @ WindowExpression(e, s @ WindowSpecDefinition(_, o, UnspecifiedFrame)) if e.resolved =>
+ val frame = if (o.nonEmpty) {
+ SpecifiedWindowFrame(RangeFrame, UnboundedPreceding, CurrentRow)
+ } else {
+ SpecifiedWindowFrame(RowFrame, UnboundedPreceding, UnboundedFollowing)
+ }
+ we.copy(windowSpec = s.copy(frameSpecification = frame))
+
+ case e => e
+ }
+
+ /**
+ * Ensures that [[WindowExpression.windowSpec.orderSpec]] is not missing.
+ *
+ * In case of [[RankLike]] window functions, it attaches the resolved order to the
+ * function to finalize it.
+ */
+ def resolveOrder(windowExpression: WindowExpression): WindowExpression = windowExpression match {
+ case WindowExpression(wf: WindowFunction, spec) if spec.orderSpec.isEmpty =>
+ throw QueryCompilationErrors.windowFunctionWithWindowFrameNotOrderedError(wf)
+
+ case WindowExpression(rank: RankLike, spec) if spec.resolved =>
+ val order = spec.orderSpec.map(_.child)
+ WindowExpression(rank.withOrder(order), spec)
+
+ case e => e
+ }
+
+ /**
+ * Validates a resolved [[WindowExpression]] to ensure it conforms to the allowed constraints.
+ *
+ * By checking the type and configuration of [[WindowExpression.windowFunction]] it enforces the
+ * following rules:
+ * - Disallows a [[FrameLessOffsetWindowFunction]] (e.g. [[Lag]]) without a defined ordering, or
+ * one whose frame is defined as anything other than an offset frame (e.g.
+ * `ROWS BETWEEN` is logically incompatible with offset functions).
+ * - Disallows distinct aggregate expressions in window functions.
+ * - Disallows certain aggregate functions ([[ListAgg]], [[PercentileCont]],
+ * [[PercentileDisc]], [[Median]]) when used with an incompatible window specification.
+ * - Allows only window functions of the following types:
+ * - [[AggregateExpression]] (non-distinct)
+ * - [[FrameLessOffsetWindowFunction]]
+ * - [[AggregateWindowFunction]]
+ */
+ def validateResolvedWindowExpression(windowExpression: WindowExpression): Unit = {
+ checkWindowFunctionAndFrameMismatch(windowExpression)
+ checkWindowFunction(windowExpression)
+ }
+
+ def checkWindowFunctionAndFrameMismatch(windowExpression: WindowExpression): Unit = {
+ windowExpression match {
+ case _ @ WindowExpression(
+ windowFunction: FrameLessOffsetWindowFunction,
+ WindowSpecDefinition(_, order, frame: SpecifiedWindowFrame)
+ ) if order.isEmpty || !frame.isOffset =>
+ windowExpression.failAnalysis(
+ errorClass = "WINDOW_FUNCTION_AND_FRAME_MISMATCH",
+ messageParameters = Map(
+ "funcName" -> toSQLExpr(windowFunction),
+ "windowExpr" -> toSQLExpr(windowExpression)
+ )
+ )
+ case _ =>
+ }
+ }
+
+ def checkWindowFunction(windowExpression: WindowExpression): Unit = {
+ windowExpression.windowFunction match {
+ case AggregateExpression(_, _, true, _, _) =>
+ windowExpression.failAnalysis(
+ errorClass = "DISTINCT_WINDOW_FUNCTION_UNSUPPORTED",
+ messageParameters = Map("windowExpr" -> toSQLExpr(windowExpression))
+ )
+ case agg @ AggregateExpression(fun: ListAgg, _, _, _, _)
+ // listagg(...) WITHIN GROUP (ORDER BY ...) OVER (ORDER BY ...) is unsupported
+ if fun.orderingFilled && (windowExpression.windowSpec.orderSpec.nonEmpty ||
+ windowExpression.windowSpec.frameSpecification !=
+ SpecifiedWindowFrame(RowFrame, UnboundedPreceding, UnboundedFollowing)) =>
+ agg.failAnalysis(
+ errorClass = "INVALID_WINDOW_SPEC_FOR_AGGREGATION_FUNC",
+ messageParameters = Map("aggFunc" -> toSQLExpr(agg.aggregateFunction))
+ )
+ case agg @ AggregateExpression(_: PercentileCont | _: PercentileDisc | _: Median, _, _, _, _)
+ if windowExpression.windowSpec.orderSpec.nonEmpty ||
+ windowExpression.windowSpec.frameSpecification !=
+ SpecifiedWindowFrame(RowFrame, UnboundedPreceding, UnboundedFollowing) =>
+ agg.failAnalysis(
+ errorClass = "INVALID_WINDOW_SPEC_FOR_AGGREGATION_FUNC",
+ messageParameters = Map("aggFunc" -> toSQLExpr(agg.aggregateFunction))
+ )
+ case _: AggregateExpression | _: FrameLessOffsetWindowFunction | _: AggregateWindowFunction =>
+ case other =>
+ other.failAnalysis(
+ errorClass = "UNSUPPORTED_EXPR_FOR_WINDOW",
+ messageParameters = Map("sqlExpr" -> toSQLExpr(other))
+ )
+ }
+ }
+}
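`resolveFrame` above falls back to the standard SQL defaults when the window spec leaves the frame unspecified: `RANGE BETWEEN UNBOUNDED PRECEDING AND CURRENT ROW` when an ORDER BY is present, and `ROWS BETWEEN UNBOUNDED PRECEDING AND UNBOUNDED FOLLOWING` otherwise. A small stand-in sketch of that selection (not the Spark expression classes):

{{{
// Stand-in types illustrating how an unspecified window frame is defaulted.
object DefaultWindowFrameSketch {
  sealed trait FrameType
  case object RowFrame extends FrameType
  case object RangeFrame extends FrameType
  final case class Frame(tpe: FrameType, lower: String, upper: String)

  def defaultFrame(hasOrderSpec: Boolean): Frame =
    if (hasOrderSpec) {
      // e.g. SUM(x) OVER (ORDER BY y) behaves as a running total.
      Frame(RangeFrame, "UNBOUNDED PRECEDING", "CURRENT ROW")
    } else {
      // e.g. SUM(x) OVER (PARTITION BY p) aggregates the whole partition.
      Frame(RowFrame, "UNBOUNDED PRECEDING", "UNBOUNDED FOLLOWING")
    }

  def main(args: Array[String]): Unit = {
    println(defaultFrame(hasOrderSpec = true))
    println(defaultFrame(hasOrderSpec = false))
  }
}
}}}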
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/executeImmediate.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/executeImmediate.scala
index 2b7eed0dc7950..b926cdf57f169 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/executeImmediate.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/executeImmediate.scala
@@ -51,7 +51,8 @@ class SubstituteExecuteImmediate(
val catalogManager: CatalogManager,
resolveChild: LogicalPlan => LogicalPlan,
checkAnalysis: LogicalPlan => Unit)
- extends Rule[LogicalPlan] with ColumnResolutionHelper {
+ extends Rule[LogicalPlan] {
+ private val variableResolution = new VariableResolution(catalogManager.tempVariableManager)
def resolveVariable(e: Expression): Expression = {
@@ -201,7 +202,10 @@ class SubstituteExecuteImmediate(
}
private def getVariableReference(expr: Expression, nameParts: Seq[String]): VariableReference = {
- lookupVariable(nameParts) match {
+ variableResolution.lookupVariable(
+ nameParts = nameParts,
+ resolvingExecuteImmediate = AnalysisContext.get.isExecuteImmediate
+ ) match {
case Some(variable) => variable
case _ =>
throw QueryCompilationErrors
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateExpressionResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateExpressionResolver.scala
index 4a01bf14fe4bc..b194a4e44a9d1 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateExpressionResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateExpressionResolver.scala
@@ -18,11 +18,6 @@
package org.apache.spark.sql.catalyst.analysis.resolver
import org.apache.spark.sql.AnalysisException
-import org.apache.spark.sql.catalyst.analysis.{
- AnsiTypeCoercion,
- CollationTypeCoercion,
- TypeCoercion
-}
import org.apache.spark.sql.catalyst.expressions.{Expression, OuterReference, SubExprUtils}
import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, ListAgg}
import org.apache.spark.sql.catalyst.util.toPrettySQL
@@ -41,11 +36,6 @@ class AggregateExpressionResolver(
private val traversals = expressionResolver.getExpressionTreeTraversals
- protected override val ansiTransformations: CoercesExpressionTypes.Transformations =
- AggregateExpressionResolver.ANSI_TYPE_COERCION_TRANSFORMATIONS
- protected override val nonAnsiTransformations: CoercesExpressionTypes.Transformations =
- AggregateExpressionResolver.TYPE_COERCION_TRANSFORMATIONS
-
private val expressionResolutionContextStack =
expressionResolver.getExpressionResolutionContextStack
private val subqueryRegistry = operatorResolver.getSubqueryRegistry
@@ -58,6 +48,7 @@ class AggregateExpressionResolver(
* resolving its children recursively and validating the resolved expression.
*/
override def resolve(aggregateExpression: AggregateExpression): Expression = {
+ expressionResolutionContextStack.peek().resolvingTreeUnderAggregateExpression = true
val aggregateExpressionWithChildrenResolved =
withResolvedChildren(aggregateExpression, expressionResolver.resolve _)
.asInstanceOf[AggregateExpression]
@@ -132,15 +123,13 @@ class AggregateExpressionResolver(
throwNestedAggregateFunction(aggregateExpression)
}
- val nonDeterministicChild =
- aggregateExpression.aggregateFunction.children.collectFirst {
- case child if !child.deterministic => child
+ aggregateExpression.aggregateFunction.children.foreach { child =>
+ if (!child.deterministic) {
+ throwAggregateFunctionWithNondeterministicExpression(
+ aggregateExpression,
+ child
+ )
}
- if (nonDeterministicChild.nonEmpty) {
- throwAggregateFunctionWithNondeterministicExpression(
- aggregateExpression,
- nonDeterministicChild.get
- )
}
}
@@ -249,23 +238,3 @@ class AggregateExpressionResolver(
)
}
}
-
-object AggregateExpressionResolver {
- // Ordering in the list of type coercions should be in sync with the list in [[TypeCoercion]].
- private val TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- CollationTypeCoercion.apply,
- TypeCoercion.InTypeCoercion.apply,
- TypeCoercion.FunctionArgumentTypeCoercion.apply,
- TypeCoercion.IfTypeCoercion.apply,
- TypeCoercion.ImplicitTypeCoercion.apply
- )
-
- // Ordering in the list of type coercions should be in sync with the list in [[AnsiTypeCoercion]].
- private val ANSI_TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- CollationTypeCoercion.apply,
- AnsiTypeCoercion.InTypeCoercion.apply,
- AnsiTypeCoercion.FunctionArgumentTypeCoercion.apply,
- AnsiTypeCoercion.IfTypeCoercion.apply,
- AnsiTypeCoercion.ImplicitTypeCoercion.apply
- )
-}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolutionResult.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolutionResult.scala
index d96185f642fd8..d4bb96e8d72f0 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolutionResult.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolutionResult.scala
@@ -20,14 +20,15 @@ package org.apache.spark.sql.catalyst.analysis.resolver
import java.util.HashSet
import org.apache.spark.sql.catalyst.expressions.{Alias, ExprId, NamedExpression}
-import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan}
/**
- * Stores the resulting operator, output list, grouping attributes and list of aliases from
- * aggregate list, obtained by resolving an [[Aggregate]] operator.
+ * Stores the resulting operator, output list, grouping attributes, list of aliases from
+ * the aggregate list, and the base [[Aggregate]], obtained by resolving an [[Aggregate]] operator.
*/
case class AggregateResolutionResult(
operator: LogicalPlan,
outputList: Seq[NamedExpression],
- groupingAttributeIds: Option[HashSet[ExprId]],
- aggregateListAliases: Seq[Alias])
+ groupingAttributeIds: HashSet[ExprId],
+ aggregateListAliases: Seq[Alias],
+ baseAggregate: Aggregate)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolver.scala
index fffd55b5897bd..7591452b76d21 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateResolver.scala
@@ -17,24 +17,18 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import java.util.{HashSet, LinkedHashMap}
+import java.util.HashSet
-import scala.jdk.CollectionConverters._
-
-import org.apache.spark.sql.catalyst.analysis.{
- AnalysisErrorAt,
- NondeterministicExpressionCollection,
- UnresolvedAttribute
-}
+import org.apache.spark.sql.catalyst.analysis.{AnalysisErrorAt, UnresolvedAttribute}
import org.apache.spark.sql.catalyst.expressions.{
Alias,
+ AliasHelper,
AttributeReference,
Expression,
ExprId,
- ExprUtils,
- NamedExpression
+ ExprUtils
}
-import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan, Project}
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan}
/**
* Resolves an [[Aggregate]] by resolving its child, aggregate expressions and grouping
@@ -42,7 +36,8 @@ import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan, Proj
* related to [[Aggregate]] resolution.
*/
class AggregateResolver(operatorResolver: Resolver, expressionResolver: ExpressionResolver)
- extends TreeNodeResolver[Aggregate, LogicalPlan] {
+ extends TreeNodeResolver[Aggregate, LogicalPlan]
+ with AliasHelper {
private val scopes = operatorResolver.getNameScopes
private val lcaResolver = expressionResolver.getLcaResolver
@@ -50,17 +45,27 @@ class AggregateResolver(operatorResolver: Resolver, expressionResolver: Expressi
* Resolve [[Aggregate]] operator.
*
* 1. Resolve the child (inline table).
- * 2. Resolve aggregate expressions using [[ExpressionResolver.resolveAggregateExpressions]] and
+ * 2. Clear [[NameScope.availableAliases]]. Those are only relevant for the immediate aggregate
+ * expressions for output prioritization to work correctly in
+ * [[NameScope.tryResolveMultipartNameByOutput]].
+ * 3. Resolve aggregate expressions using [[ExpressionResolver.resolveAggregateExpressions]] and
* set [[NameScope.ordinalReplacementExpressions]] for grouping expressions resolution.
- * 3. If there's just one [[UnresolvedAttribute]] with a single-part name "ALL", expand it using
+ * 4. If there's just one [[UnresolvedAttribute]] with a single-part name "ALL", expand it using
* aggregate expressions which don't contain aggregate functions. There should not exist a
* column with that name in the lower operator's output, otherwise it takes precedence.
- * 4. Resolve grouping expressions using [[ExpressionResolver.resolveGroupingExpressions]]. This
+ * 5. Resolve grouping expressions using [[ExpressionResolver.resolveGroupingExpressions]]. This
* includes alias references to aggregate expressions, which is done in
* [[NameScope.resolveMultipartName]] and replacing [[UnresolvedOrdinals]] with corresponding
* expressions from aggregate list, done in [[OrdinalResolver]].
- * 5. Substitute non-deterministic expressions with derived attribute references to an
- * artificial [[Project]] list.
+ * 6. Remove unnecessary [[Alias]]es from the grouping expressions (all aliases) and from the
+ * aggregate expressions (keep only the outermost one). This is needed to stay compatible
+ * with the fixed-point implementation. For example:
+ *
+ * {{{ SELECT timestamp(col1:str) FROM VALUES('a') GROUP BY timestamp(col1:str); }}}
+ *
+ * Here we end up having inner [[Alias]]es in both the grouping and aggregate expressions
+ * lists, which are not comparable because they have different expression IDs (so we have to
+ * strip them).
*
* If the resulting [[Aggregate]] contains lateral columns references, delegate the resolution of
* these columns to [[LateralColumnAliasResolver.handleLcaInAggregate]]. Otherwise, validate the
@@ -73,6 +78,8 @@ class AggregateResolver(operatorResolver: Resolver, expressionResolver: Expressi
val resolvedAggregate = try {
val resolvedChild = operatorResolver.resolve(unresolvedAggregate.child)
+ scopes.current.availableAliases.clear()
+
val resolvedAggregateExpressions = expressionResolver.resolveAggregateExpressions(
unresolvedAggregate.aggregateExpressions,
unresolvedAggregate
@@ -100,21 +107,25 @@ class AggregateResolver(operatorResolver: Resolver, expressionResolver: Expressi
)
}
- val partiallyResolvedAggregate = unresolvedAggregate.copy(
- groupingExpressions = resolvedGroupingExpressions,
- aggregateExpressions = resolvedAggregateExpressions.expressions,
+ val resolvedGroupingExpressionsWithoutAliases = resolvedGroupingExpressions.map(trimAliases)
+ val resolvedAggregateExpressionsWithoutAliases =
+ resolvedAggregateExpressions.expressions.map(trimNonTopLevelAliases)
+
+ val resolvedAggregate = unresolvedAggregate.copy(
+ groupingExpressions = resolvedGroupingExpressionsWithoutAliases,
+ aggregateExpressions = resolvedAggregateExpressionsWithoutAliases,
child = resolvedChild
)
- val resolvedAggregate = tryPullOutNondeterministic(partiallyResolvedAggregate)
-
if (resolvedAggregateExpressions.hasLateralColumnAlias) {
val aggregateWithLcaResolutionResult = lcaResolver.handleLcaInAggregate(resolvedAggregate)
AggregateResolutionResult(
operator = aggregateWithLcaResolutionResult.resolvedOperator,
outputList = aggregateWithLcaResolutionResult.outputList,
- groupingAttributeIds = None,
- aggregateListAliases = aggregateWithLcaResolutionResult.aggregateListAliases
+ groupingAttributeIds =
+ getGroupingAttributeIds(aggregateWithLcaResolutionResult.baseAggregate),
+ aggregateListAliases = aggregateWithLcaResolutionResult.aggregateListAliases,
+ baseAggregate = aggregateWithLcaResolutionResult.baseAggregate
)
} else {
// TODO: This validation function does a post-traversal. This is discouraged in single-pass
@@ -124,8 +135,9 @@ class AggregateResolver(operatorResolver: Resolver, expressionResolver: Expressi
AggregateResolutionResult(
operator = resolvedAggregate,
outputList = resolvedAggregate.aggregateExpressions,
- groupingAttributeIds = Some(getGroupingAttributeIds(resolvedAggregate)),
- aggregateListAliases = scopes.current.getTopAggregateExpressionAliases
+ groupingAttributeIds = getGroupingAttributeIds(resolvedAggregate),
+ aggregateListAliases = scopes.current.getTopAggregateExpressionAliases,
+ baseAggregate = resolvedAggregate
)
}
} finally {
@@ -134,8 +146,9 @@ class AggregateResolver(operatorResolver: Resolver, expressionResolver: Expressi
scopes.overwriteOutputAndExtendHiddenOutput(
output = resolvedAggregate.outputList.map(_.toAttribute),
- groupingAttributeIds = resolvedAggregate.groupingAttributeIds,
- aggregateListAliases = resolvedAggregate.aggregateListAliases
+ groupingAttributeIds = Some(resolvedAggregate.groupingAttributeIds),
+ aggregateListAliases = resolvedAggregate.aggregateListAliases,
+ baseAggregate = Some(resolvedAggregate.baseAggregate)
)
resolvedAggregate.operator
@@ -208,53 +221,6 @@ class AggregateResolver(operatorResolver: Resolver, expressionResolver: Expressi
}
}
- /**
- * In case there are non-deterministic expressions in either `groupingExpressions` or
- * `aggregateExpressions` replace them with attributes created out of corresponding
- * non-deterministic expression. Example:
- *
- * {{{ SELECT RAND() GROUP BY 1; }}}
- *
- * This query would have the following analyzed plan:
- * Aggregate(
- * groupingExpressions = [AttributeReference(_nonDeterministic)]
- * aggregateExpressions = [Alias(AttributeReference(_nonDeterministic), `rand()`)]
- * child = Project(
- * projectList = [Alias(Rand(...), `_nondeterministic`)]
- * child = OneRowRelation
- * )
- * )
- */
- private def tryPullOutNondeterministic(aggregate: Aggregate): Aggregate = {
- val nondeterministicToAttributes: LinkedHashMap[Expression, NamedExpression] =
- NondeterministicExpressionCollection.getNondeterministicToAttributes(
- aggregate.groupingExpressions
- )
-
- if (!nondeterministicToAttributes.isEmpty) {
- val newChild = Project(
- scopes.current.output ++ nondeterministicToAttributes.values.asScala.toSeq,
- aggregate.child
- )
- val resolvedAggregateExpressions = aggregate.aggregateExpressions.map { expression =>
- PullOutNondeterministicExpressionInExpressionTree(expression, nondeterministicToAttributes)
- }
- val resolvedGroupingExpressions = aggregate.groupingExpressions.map { expression =>
- PullOutNondeterministicExpressionInExpressionTree(
- expression,
- nondeterministicToAttributes
- )
- }
- aggregate.copy(
- groupingExpressions = resolvedGroupingExpressions,
- aggregateExpressions = resolvedAggregateExpressions,
- child = newChild
- )
- } else {
- aggregate
- }
- }
-
private def canGroupByAll(expressions: Seq[Expression]): Boolean = {
val isOrderByAll = expressions match {
case Seq(unresolvedAttribute: UnresolvedAttribute) =>
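Step 6 of the updated doc comment above strips inner aliases so that structurally identical grouping and aggregate expressions compare equal even though each `Alias` carries a fresh expression ID. A toy expression tree illustrating why the trimming matters (simplified types, not Catalyst's):

{{{
// Toy expression tree showing why inner aliases are stripped: two structurally
// identical expressions only compare equal once alias wrappers (which carry
// fresh IDs) are removed.
object TrimAliasSketch {
  sealed trait Expr
  final case class Attr(name: String) extends Expr
  final case class Cast(child: Expr, to: String) extends Expr
  final case class Alias(child: Expr, name: String, id: Long) extends Expr

  def trimAliases(e: Expr): Expr = e match {
    case Alias(child, _, _) => trimAliases(child)
    case Cast(child, to) => Cast(trimAliases(child), to)
    case other => other
  }

  def main(args: Array[String]): Unit = {
    // The same expression appears in the grouping and aggregate lists, but each
    // occurrence was aliased with a different expression ID.
    val grouping = Alias(Cast(Attr("col1"), "timestamp"), "timestamp(col1)", id = 1L)
    val aggregate = Alias(Cast(Attr("col1"), "timestamp"), "timestamp(col1)", id = 2L)
    println(grouping == aggregate)                           // false
    println(trimAliases(grouping) == trimAliases(aggregate)) // true
  }
}
}}}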
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateWithLcaResolutionResult.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateWithLcaResolutionResult.scala
index 535c41cad39ec..15d4ac4f5ceb3 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateWithLcaResolutionResult.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AggregateWithLcaResolutionResult.scala
@@ -18,7 +18,7 @@
package org.apache.spark.sql.catalyst.analysis.resolver
import org.apache.spark.sql.catalyst.expressions.{Alias, NamedExpression}
-import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LogicalPlan}
/**
* Stores the result of resolution of lateral column aliases in an [[Aggregate]].
@@ -26,8 +26,11 @@ import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
* @param outputList The output list of the resolved operator.
* @param aggregateListAliases List of aliases from aggregate list and all artificially inserted
* [[Project]] nodes.
+ * @param baseAggregate [[Aggregate]] node constructed by [[LateralColumnAliasResolver]] while
+ * resolving lateral column references in [[Aggregate]].
*/
case class AggregateWithLcaResolutionResult(
resolvedOperator: LogicalPlan,
outputList: Seq[NamedExpression],
- aggregateListAliases: Seq[Alias])
+ aggregateListAliases: Seq[Alias],
+ baseAggregate: Aggregate)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AliasResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AliasResolver.scala
index 83329c0fe464d..b56281fa12ba8 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AliasResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AliasResolver.scala
@@ -17,13 +17,14 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import org.apache.spark.sql.catalyst.analysis.{AliasResolution, MultiAlias, UnresolvedAlias}
+import org.apache.spark.sql.catalyst.analysis.{AliasResolution, UnresolvedAlias}
import org.apache.spark.sql.catalyst.expressions.{
Alias,
Expression,
NamedExpression,
OuterReference
}
+import org.apache.spark.sql.errors.QueryCompilationErrors
/**
* Resolver class that resolves unresolved aliases and handles user-specified aliases.
@@ -45,25 +46,32 @@ class AliasResolver(expressionResolver: ExpressionResolver)
* we create a new [[Alias]] using the [[AutoGeneratedAliasProvider]]. Here we allow inner
* aliases to persist until the end of single-pass resolution, after which they will be removed
* in the post-processing phase.
+ *
+ * Resulting [[Alias]] must be added to the list of `availableAliases` in the current
+ * [[NameScope]].
*/
override def resolve(unresolvedAlias: UnresolvedAlias): NamedExpression =
- scopes.current.lcaRegistry.withNewLcaScope {
+ scopes.current.lcaRegistry.withNewLcaScope(
+ isTopLevelAlias = expressionResolutionContextStack.peek().isTopOfProjectList
+ ) {
val aliasWithResolvedChildren =
withResolvedChildren(unresolvedAlias, expressionResolver.resolve _)
.asInstanceOf[UnresolvedAlias]
- val resolvedAlias =
+ val resolvedNode =
AliasResolution.resolve(aliasWithResolvedChildren).asInstanceOf[NamedExpression]
- resolvedAlias match {
- case multiAlias: MultiAlias =>
- throw new ExplicitlyUnsupportedResolverFeature(
- s"unsupported expression: ${multiAlias.getClass.getName}"
- )
+ resolvedNode match {
case alias: Alias =>
- expressionResolver.getExpressionIdAssigner.mapExpression(alias)
+ val resultAlias = expressionResolver.getExpressionIdAssigner.mapExpression(alias)
+ scopes.current.availableAliases.add(resultAlias.exprId)
+ resultAlias
case outerReference: OuterReference =>
autoGeneratedAliasProvider.newAlias(outerReference)
+ case _ =>
+ throw QueryCompilationErrors.unsupportedSinglePassAnalyzerFeature(
+ s"${resolvedNode.getClass} expression resolution"
+ )
}
}
@@ -77,18 +85,21 @@ class AliasResolver(expressionResolver: ExpressionResolver)
* those aliases. See [[ExpressionIdAssigner.mapExpression]] doc for more details.
*/
def handleResolvedAlias(alias: Alias): Alias = {
- val resolvedAlias = scopes.current.lcaRegistry.withNewLcaScope {
+ val resolvedAlias = scopes.current.lcaRegistry.withNewLcaScope(
+ isTopLevelAlias = expressionResolutionContextStack.peek().isTopOfProjectList
+ ) {
val aliasWithResolvedChildren =
withResolvedChildren(alias, expressionResolver.resolve _).asInstanceOf[Alias]
- val mappedAlias = expressionResolver.getExpressionIdAssigner.mapExpression(
+ val resultAlias = expressionResolver.getExpressionIdAssigner.mapExpression(
originalExpression = aliasWithResolvedChildren,
prioritizeOldDuplicateAliasId =
expressionResolutionContextStack.peek().resolvingGroupingExpressions
)
- scopes.current.availableAliases.add(mappedAlias.exprId)
- mappedAlias
+ scopes.current.availableAliases.add(resultAlias.exprId)
+
+ resultAlias
}
collapseAlias(resolvedAlias)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AutoGeneratedAliasProvider.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AutoGeneratedAliasProvider.scala
index 2a49581b3499b..5fd5a5ff7870e 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AutoGeneratedAliasProvider.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/AutoGeneratedAliasProvider.scala
@@ -62,7 +62,7 @@ class AutoGeneratedAliasProvider(expressionIdAssigner: ExpressionIdAssigner) {
name: Option[String] = None,
explicitMetadata: Option[Metadata] = None,
skipExpressionIdAssigner: Boolean = false): Alias = {
- var alias = Alias(
+ val alias = Alias(
child = child,
name = name.getOrElse(toPrettySQL(child))
)(
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/BinaryArithmeticResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/BinaryArithmeticResolver.scala
index d88a450a5acda..0668c0a6513b7 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/BinaryArithmeticResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/BinaryArithmeticResolver.scala
@@ -17,19 +17,11 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import org.apache.spark.sql.catalyst.analysis.{
- AnsiStringPromotionTypeCoercion,
- AnsiTypeCoercion,
- BinaryArithmeticWithDatetimeResolver,
- DecimalPrecisionTypeCoercion,
- DivisionTypeCoercion,
- IntegralDivisionTypeCoercion,
- StringPromotionTypeCoercion,
- TypeCoercion
-}
+import org.apache.spark.sql.catalyst.analysis.BinaryArithmeticWithDatetimeResolver
import org.apache.spark.sql.catalyst.expressions.{
Add,
BinaryArithmetic,
+ Cast,
DateAdd,
Divide,
Expression,
@@ -37,7 +29,7 @@ import org.apache.spark.sql.catalyst.expressions.{
Subtract,
SubtractDates
}
-import org.apache.spark.sql.types.{DateType, StringType}
+import org.apache.spark.sql.types._
/**
* [[BinaryArithmeticResolver]] is invoked by [[ExpressionResolver]] in order to resolve
@@ -63,7 +55,7 @@ import org.apache.spark.sql.types.{DateType, StringType}
*
* Cast(
* DatetimeSub(
- * TimeAdd(
+ * TimestampAddInterval(
* Literal('4 11:11', StringType),
* UnaryMinus(
* Literal(Interval('4 22:12' DAY TO MINUTE), DayTimeIntervalType(0,2))
@@ -77,8 +69,8 @@ import org.apache.spark.sql.types.{DateType, StringType}
* top-most node itself is not resolved recursively in order to avoid recursive calls to
* [[BinaryArithmeticResolver]] and other sub-resolvers. To prevent a case where we resolve the
* same node twice, we need to mark nodes that will act as a limit for the downwards traversal by
- * applying a [[ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY]] tag to them. These children
- * along with all the nodes below them are guaranteed to be resolved at this point. When
+ * applying a [[ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY]] tag to them. These children along with
+ * all the nodes below them are guaranteed to be resolved at this point. When
* [[ExpressionResolver]] reaches one of the tagged nodes, it returns identity rather than
* resolving it. Finally, after resolving the subtree, we need to resolve the top-most node itself,
* which in this case means applying a timezone, if necessary.
@@ -90,11 +82,6 @@ class BinaryArithmeticResolver(expressionResolver: ExpressionResolver)
private val traversals = expressionResolver.getExpressionTreeTraversals
- protected override val ansiTransformations: CoercesExpressionTypes.Transformations =
- BinaryArithmeticResolver.ANSI_TYPE_COERCION_TRANSFORMATIONS
- protected override val nonAnsiTransformations: CoercesExpressionTypes.Transformations =
- BinaryArithmeticResolver.TYPE_COERCION_TRANSFORMATIONS
-
override def resolve(unresolvedBinaryArithmetic: BinaryArithmetic): Expression = {
val binaryArithmeticWithResolvedChildren: BinaryArithmetic =
withResolvedChildren(unresolvedBinaryArithmetic, expressionResolver.resolve _)
@@ -117,8 +104,9 @@ class BinaryArithmeticResolver(expressionResolver: ExpressionResolver)
* of nodes.
*/
private def transformBinaryArithmeticNode(binaryArithmetic: BinaryArithmetic): Expression = {
+ val binaryArithmeticWithNullReplaced: Expression = replaceNullType(binaryArithmetic)
val binaryArithmeticWithDateTypeReplaced: Expression =
- replaceDateType(binaryArithmetic)
+ replaceDateType(binaryArithmeticWithNullReplaced)
val binaryArithmeticWithTypeCoercion: Expression =
coerceExpressionTypes(
expression = binaryArithmeticWithDateTypeReplaced,
@@ -154,26 +142,29 @@ class BinaryArithmeticResolver(expressionResolver: ExpressionResolver)
BinaryArithmeticWithDatetimeResolver.resolve(arithmetic)
case other => other
}
-}
-object BinaryArithmeticResolver {
- // Ordering in the list of type coercions should be in sync with the list in [[TypeCoercion]].
- private val TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- StringPromotionTypeCoercion.apply,
- DecimalPrecisionTypeCoercion.apply,
- DivisionTypeCoercion.apply,
- IntegralDivisionTypeCoercion.apply,
- TypeCoercion.ImplicitTypeCoercion.apply,
- TypeCoercion.DateTimeOperationsTypeCoercion.apply
- )
-
- // Ordering in the list of type coercions should be in sync with the list in [[AnsiTypeCoercion]].
- private val ANSI_TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- AnsiStringPromotionTypeCoercion.apply,
- DecimalPrecisionTypeCoercion.apply,
- DivisionTypeCoercion.apply,
- IntegralDivisionTypeCoercion.apply,
- AnsiTypeCoercion.ImplicitTypeCoercion.apply,
- AnsiTypeCoercion.AnsiDateTimeOperationsTypeCoercion.apply
- )
+ /**
+ * Replaces NullType with a compatible type in arithmetic expressions over datetime operands.
+ * This avoids recursive calls of [[BinaryArithmeticWithDatetimeResolver]], which would first
+ * convert unacceptable `NullType` nulls to the expected datetime types and then, on the
+ * following steps, replace arithmetic `Add` and `Subtract` with the corresponding datetime
+ * expressions.
+ */
+ private def replaceNullType(expression: Expression): Expression = expression match {
+ case a @ Add(l, r, _) => (l.dataType, r.dataType) match {
+ case (_: DatetimeType, _: NullType) =>
+ a.copy(right = Cast(a.right, DayTimeIntervalType.DEFAULT))
+ case (_: NullType, _: DatetimeType) =>
+ a.copy(left = Cast(a.left, DayTimeIntervalType.DEFAULT))
+ case _ => a
+ }
+ case s @ Subtract(l, r, _) => (l.dataType, r.dataType) match {
+ case (_: NullType, _: DatetimeType) =>
+ s.copy(left = Cast(s.left, s.right.dataType))
+ case (_: DatetimeType, _: NullType) =>
+ s.copy(right = Cast(s.right, s.left.dataType))
+ case _ => s
+ }
+ case other => other
+ }
}
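A note on the new `replaceNullType` step above: its effect is easiest to see on a tiny Catalyst expression tree. The following sketch is illustrative only (it assumes spark-catalyst on the classpath and uses `Literal.default` just for brevity); it is not code from the resolver:

    import org.apache.spark.sql.catalyst.expressions.{Add, Cast, Literal}
    import org.apache.spark.sql.types.{DayTimeIntervalType, NullType, TimestampType}

    // TIMESTAMP '...' + NULL: the right operand is an untyped null.
    val original = Add(Literal.default(TimestampType), Literal(null, NullType))

    // After the replacement, the NullType operand is wrapped in a cast to a day-time interval,
    // so the subsequent datetime rewrite sees an interval operand instead of NullType:
    val replaced = Add(
      Literal.default(TimestampType),
      Cast(Literal(null, NullType), DayTimeIntervalType.DEFAULT))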
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TryExtractOrdinal.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CandidatesForResolution.scala
similarity index 67%
rename from sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TryExtractOrdinal.scala
rename to sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CandidatesForResolution.scala
index 42766a78e248f..3b8ec61bf5ee8 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TryExtractOrdinal.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CandidatesForResolution.scala
@@ -17,18 +17,10 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import org.apache.spark.sql.catalyst.expressions.{Expression, IntegerLiteral}
+import org.apache.spark.sql.catalyst.expressions.Attribute
/**
- * Try to extract ordinal from an expression. Return `Some(ordinal)` if the type of the expression
- * is [[IntegerLitera]], `None` otherwise.
+ * [[CandidatesForResolution]] is used by the [[NameScope]] during multipart name resolution to
+ * prioritize attributes from different types of operator output (main, hidden, metadata).
*/
-object TryExtractOrdinal {
- def apply(expression: Expression): Option[Int] = {
- expression match {
- case IntegerLiteral(literal) =>
- Some(literal)
- case other => None
- }
- }
-}
+case class CandidatesForResolution(attributes: Seq[Attribute], outputType: OutputType.OutputType)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CoercesExpressionTypes.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CoercesExpressionTypes.scala
index 0fc6a6742edad..34be99a1abc0d 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CoercesExpressionTypes.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CoercesExpressionTypes.scala
@@ -33,6 +33,7 @@ import org.apache.spark.sql.catalyst.analysis.{
TypeCoercion
}
import org.apache.spark.sql.catalyst.expressions.{Cast, Expression}
+import org.apache.spark.sql.catalyst.trees.CurrentOrigin.withOrigin
/**
* [[CoercesExpressionTypes]] is extended by resolvers that need to apply type coercion.
@@ -57,27 +58,42 @@ trait CoercesExpressionTypes extends SQLConfHelper {
*
* In the end, we apply [[DefaultCollationTypeCoercion]].
* See [[DefaultCollationTypeCoercion]] doc for more info.
+ *
+ * Additionally, we copy the tags and origin in case the call to this method didn't come from
+ * [[ExpressionResolver]], where they are copied generically.
*/
def coerceExpressionTypes(
expression: Expression,
expressionTreeTraversal: ExpressionTreeTraversal): Expression = {
- val coercedExpressionOnce = applyTypeCoercion(
- expression = expression,
- expressionTreeTraversal = expressionTreeTraversal
- )
- // This is a hack necessary because fixed-point analyzer sometimes requires multiple passes to
- // resolve type coercion. Instead, in single pass, we apply type coercion twice on the same
- // node in order to ensure that types are resolved.
- val coercedExpressionTwice = applyTypeCoercion(
- expression = coercedExpressionOnce,
- expressionTreeTraversal = expressionTreeTraversal
- )
+ withOrigin(expression.origin) {
+ val coercedExpressionOnce = applyTypeCoercion(
+ expression = expression,
+ expressionTreeTraversal = expressionTreeTraversal
+ )
+
+ // If the expression isn't changed by the first iteration of type coercion,
+ // the second iteration won't be effective either.
+ val expressionAfterTypeCoercion = if (coercedExpressionOnce.eq(expression)) {
+ coercedExpressionOnce
+ } else {
+ // This is a hack necessary because fixed-point analyzer sometimes requires multiple passes
+ // to resolve type coercion. Instead, in single pass, we apply type coercion twice on the
+ // same node in order to ensure that types are resolved.
+ applyTypeCoercion(
+ expression = coercedExpressionOnce,
+ expressionTreeTraversal = expressionTreeTraversal
+ )
+ }
+
+ val coercionResult = expressionTreeTraversal.defaultCollation match {
+ case Some(defaultCollation) =>
+ DefaultCollationTypeCoercion(expressionAfterTypeCoercion, defaultCollation)
+ case None =>
+ expressionAfterTypeCoercion
+ }
- expressionTreeTraversal.defaultCollation match {
- case Some(defaultCollation) =>
- DefaultCollationTypeCoercion(coercedExpressionTwice, defaultCollation)
- case None =>
- coercedExpressionTwice
+ coercionResult.copyTagsFrom(expression)
+ coercionResult
}
}
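The change above boils down to "run type coercion once, and re-run it only if the first pass rewrote the expression". A minimal generic sketch of that shape (not the resolver's API; `coerce` stands in for `applyTypeCoercion`):

    // Apply `coerce` at most twice; skip the second pass when the first one was a no-op.
    // Reference equality is the cheap "did anything change?" check, as in the resolver.
    def coerceAtMostTwice[T <: AnyRef](expr: T)(coerce: T => T): T = {
      val once = coerce(expr)
      if (once.eq(expr)) once else coerce(once)
    }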
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ConditionalExpressionResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ConditionalExpressionResolver.scala
deleted file mode 100644
index 0d847cf09adf0..0000000000000
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ConditionalExpressionResolver.scala
+++ /dev/null
@@ -1,63 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.spark.sql.catalyst.analysis.resolver
-
-import org.apache.spark.sql.catalyst.analysis.{AnsiTypeCoercion, TypeCoercion}
-import org.apache.spark.sql.catalyst.expressions.{ConditionalExpression, Expression}
-
-/**
- * Resolver for [[If]], [[CaseWhen]] and [[Coalesce]] expressions.
- */
-class ConditionalExpressionResolver(expressionResolver: ExpressionResolver)
- extends TreeNodeResolver[ConditionalExpression, Expression]
- with ResolvesExpressionChildren
- with CoercesExpressionTypes {
-
- private val traversals = expressionResolver.getExpressionTreeTraversals
-
- protected override val ansiTransformations: CoercesExpressionTypes.Transformations =
- ConditionalExpressionResolver.ANSI_TYPE_COERCION_TRANSFORMATIONS
- protected override val nonAnsiTransformations: CoercesExpressionTypes.Transformations =
- ConditionalExpressionResolver.TYPE_COERCION_TRANSFORMATIONS
-
- override def resolve(unresolvedConditionalExpression: ConditionalExpression): Expression = {
- val conditionalExpressionWithResolvedChildren =
- withResolvedChildren(unresolvedConditionalExpression, expressionResolver.resolve _)
-
- coerceExpressionTypes(
- expression = conditionalExpressionWithResolvedChildren,
- expressionTreeTraversal = traversals.current
- )
- }
-}
-
-object ConditionalExpressionResolver {
- // Ordering in the list of type coercions should be in sync with the list in [[TypeCoercion]].
- private val TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- TypeCoercion.CaseWhenTypeCoercion.apply,
- TypeCoercion.FunctionArgumentTypeCoercion.apply,
- TypeCoercion.IfTypeCoercion.apply
- )
-
- // Ordering in the list of type coercions should be in sync with the list in [[AnsiTypeCoercion]].
- private val ANSI_TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- AnsiTypeCoercion.CaseWhenTypeCoercion.apply,
- AnsiTypeCoercion.FunctionArgumentTypeCoercion.apply,
- AnsiTypeCoercion.IfTypeCoercion.apply
- )
-}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CreateNamedStructResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CreateNamedStructResolver.scala
deleted file mode 100644
index d0e4ecea25cb3..0000000000000
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/CreateNamedStructResolver.scala
+++ /dev/null
@@ -1,62 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.spark.sql.catalyst.analysis.resolver
-
-import org.apache.spark.sql.catalyst.expressions.{Alias, CreateNamedStruct, Expression}
-
-/**
- * Resolves [[CreateNamedStruct]] nodes by recursively resolving children. If [[CreateNamedStruct]]
- * is not directly under an [[Alias]], removes aliases from struct fields. Otherwise, let
- * [[AliasResolver]] handle the removal.
- */
-class CreateNamedStructResolver(expressionResolver: ExpressionResolver)
- extends TreeNodeResolver[CreateNamedStruct, Expression]
- with ResolvesExpressionChildren {
-
- override def resolve(createNamedStruct: CreateNamedStruct): Expression = {
- val createNamedStructWithResolvedChildren =
- withResolvedChildren(createNamedStruct, expressionResolver.resolve)
- .asInstanceOf[CreateNamedStruct]
- CreateNamedStructResolver.cleanupAliases(createNamedStructWithResolvedChildren)
- }
-}
-
-object CreateNamedStructResolver {
-
- /**
- * For a query like:
- *
- * {{{ SELECT STRUCT(1 AS a, 2 AS b) }}}
- *
- * [[CreateNamedStruct]] will be: CreateNamedStruct(Seq("a", Alias(1, "a"), "b", Alias(2, "b")))
- *
- * Because inner aliases are not expected in the analyzed logical plan, we need to remove them
- * here. However, we only do so if [[CreateNamedStruct]] is not directly under an [[Alias]], in
- * which case the removal will be handled by [[AliasResolver]]. This is because in single-pass,
- * [[Alias]] is resolved after [[CreateNamedStruct]] and in order to compute the correct output
- * name, it needs to know complete structure of the child.
- */
- def cleanupAliases(createNamedStruct: CreateNamedStruct): CreateNamedStruct = {
- createNamedStruct
- .withNewChildren(createNamedStruct.children.map {
- case a: Alias if a.metadata.isEmpty => a.child
- case other => other
- })
- .asInstanceOf[CreateNamedStruct]
- }
-}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionIdAssigner.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionIdAssigner.scala
index 71bc7f24d5f28..9cd4c525b48c2 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionIdAssigner.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionIdAssigner.scala
@@ -326,9 +326,17 @@ class ExpressionIdAssigner {
* child mappings will have collisions during this merge operation. We need to decide which of
* the new IDs get the priority for the old ID. This is done based on the IDs that are actually
* outputted into the multi-child operator. This information is provided with `newOutputIds`.
- * If the new ID is present in that set, we treat it as a P0 over the IDs that are hidden in the
- * branch. Also, we iterate over child mappings from right to left, prioritizing IDs from the
- * left, because that's how operators like [[Union]] propagate IDs upwards.
+ *
+ * The principles:
+ * 1. If the destination ID is present in `newOutputIds`, we give it a higher priority than
+ * the ID that is "hidden" in the logical plan branch.
+ * 2. If both destination IDs are present in `newOutputIds`, we prioritize the identity mapping
+ * (the new ID that is equal to the old ID) over the "remapping". This is valid in SQL
+ * because we are dealing with a fully unresolved plan and the remapping is not needed.
+ * DataFrame queries that contain a self-join or a self-union and reference the same
+ * attribute from both branches will fail (which is expected).
+ * 3. We iterate over child mappings from right to left, prioritizing IDs from the left, because
+ * that's how multi-child operators like [[Join]] or [[Union]] propagate IDs upwards.
*
* Example 1:
* {{{
@@ -360,8 +368,19 @@ class ExpressionIdAssigner {
* df2.join(df1, df2("b") === df1("a"))
* }}}
*
- * This is used by multi child operators like [[Join]] or [[Union]] to propagate mapped
- * expression IDs upwards.
+ * Example 3:
+ * {{{
+ * -- In this query the CTE references a table which is also present in a JOIN. First, the CTE
+ * -- definition is analyzed with `t1` inside. Let's say it outputs col1#0. Once we get to the
+ * -- left JOIN child, which is also `t1`, we know that expression IDs in `t1` have to be
+ * -- regenerated to col1#1 because it's a duplicate relation. After resolving the JOIN, we are
+ * -- left with (#0 -> #0), (#1 -> #1) and (#0 -> #1) mappings. Also, the JOIN outputs both #0
+ * -- and #1. This is an example of principle 2, where the identity (#0 -> #0) and (#1 -> #1)
+ * -- mappings have to be prioritized, because (#0 -> #1) is a remapping and is not needed in SQL.
+ * SELECT * FROM (
+ * WITH cte1 AS (SELECT * FROM t1) SELECT t1.col1 FROM t1 JOIN cte1 USING (col1)
+ * );
+ * }}}
*
* When `mergeIntoExisting` is true, we merge child mappings into an existing mapping entry
* instead of creating a new one. This setting is used when resolving [[LateralJoin]]s.
@@ -380,15 +399,19 @@ class ExpressionIdAssigner {
throw SparkException.internalError("No child mappings to create new current mapping")
}
- val priorityMapping = new ExpressionIdAssigner.PriorityMapping(newOutputIds.size)
+ val newMapping = if (mergeIntoExisting) {
+ currentStackEntry.mapping.get
+ } else {
+ new ExpressionIdAssigner.Mapping
+ }
while (!currentStackEntry.childMappings.isEmpty) {
val nextMapping = currentStackEntry.childMappings.pop()
nextMapping.forEach {
case (oldId, remappedId) =>
- updatePriorityMapping(
- priorityMapping = priorityMapping,
+ updateNewMapping(
+ newMapping = newMapping,
oldId = oldId,
remappedId = remappedId,
newOutputIds = newOutputIds
@@ -396,17 +419,6 @@ class ExpressionIdAssigner {
}
}
- val newMapping = if (mergeIntoExisting) {
- currentStackEntry.mapping.get
- } else {
- new ExpressionIdAssigner.Mapping
- }
-
- priorityMapping.forEach {
- case (oldId, priority) =>
- newMapping.put(oldId, priority.pick())
- }
-
setCurrentMapping(newMapping)
}
@@ -606,27 +618,31 @@ class ExpressionIdAssigner {
}
/**
- * Update the priority mapping for the given `oldId` and `remappedId`. If the `remappedId` is
- * contained in the `newOutputIds`, we treat it as a P0 over the IDs that are not exposed from
- * the operator branch. Otherwise, we treat it as a P1.
+ * Update `newMapping` with the `oldId -> remappedId` mapping, based on the principles described
+ * in [[createMappingFromChildMappings]]:
+ * 1. If no mapping from `oldId` exists, we create it
+ * 2. If the mapping from `oldId` already exists but its target is not present in `newOutputIds`,
+ * we deprioritize the old mapping in favor of the new one
+ * 3. If the mapping from `oldId` already exists and its target is present in `newOutputIds`, and
+ * the new mapping is the identity one, we deprioritize the old mapping in favor of the new one
+ * 4. Otherwise we keep the existing mapping
*/
- private def updatePriorityMapping(
- priorityMapping: ExpressionIdAssigner.PriorityMapping,
+ private def updateNewMapping(
+ newMapping: ExpressionIdAssigner.Mapping,
oldId: ExprId,
remappedId: ExprId,
newOutputIds: Set[ExprId]): Unit = {
- if (newOutputIds.contains(remappedId)) {
- priorityMapping.merge(
- oldId,
- ExpressionIdPriority(p0 = Some(remappedId)),
- (priority, _) => priority.copy(p0 = Some(remappedId))
- )
- } else {
- priorityMapping.merge(
- oldId,
- ExpressionIdPriority(p1 = Some(remappedId)),
- (priority, _) => priority.copy(p1 = Some(remappedId))
- )
+ newMapping.get(oldId) match {
+ case null =>
+ newMapping.put(oldId, remappedId)
+
+ case knownRemappedId if !newOutputIds.contains(knownRemappedId) =>
+ newMapping.put(oldId, remappedId)
+
+ case knownRemappedId if newOutputIds.contains(remappedId) && remappedId == oldId =>
+ newMapping.put(oldId, remappedId)
+
+ case _ =>
}
}
}
@@ -641,8 +657,6 @@ object ExpressionIdAssigner {
type Stack = ArrayDeque[StackEntry]
- type PriorityMapping = HashMap[ExprId, ExpressionIdPriority]
-
/**
* Assert that `outputs` don't have conflicting expression IDs.
*/
@@ -696,15 +710,3 @@ object ExpressionIdAssigner {
}
}
}
-
-/**
- * [[ExpressionIdPriority]] is used by the [[ExpressionIdAssigner]] when merging child mappings
- * of a multi-child operator to determine which new ID gets picked in case of an old ID collision.
- */
-case class ExpressionIdPriority(p0: Option[ExprId] = None, p1: Option[ExprId] = None) {
- def pick(): ExprId = p0.getOrElse {
- p1.getOrElse {
- throw SparkException.internalError("No expression ID to pick")
- }
- }
-}
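The merge principles and the `updateNewMapping` cases above can be seen end-to-end on plain Long IDs. This is an illustrative sketch only, not the [[ExpressionIdAssigner]] API:

    import scala.collection.mutable

    // Child mappings are merged right to left so that entries from the left child win,
    // mirroring how multi-child operators propagate expression IDs upwards.
    def mergeChildMappings(
        childMappingsRightToLeft: Seq[Map[Long, Long]],
        newOutputIds: Set[Long]): mutable.LinkedHashMap[Long, Long] = {
      val merged = mutable.LinkedHashMap.empty[Long, Long]
      for (mapping <- childMappingsRightToLeft; (oldId, remappedId) <- mapping) {
        merged.get(oldId) match {
          case None =>
            merged.put(oldId, remappedId)   // principle 1: no mapping yet, create it
          case Some(known) if !newOutputIds.contains(known) =>
            merged.put(oldId, remappedId)   // existing target is hidden, prefer the new one
          case Some(_) if newOutputIds.contains(remappedId) && remappedId == oldId =>
            merged.put(oldId, remappedId)   // principle 2: the identity mapping wins
          case _ =>                         // otherwise keep the existing mapping
        }
      }
      merged
    }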
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionResolver.scala
index cfeaa54a39f60..2b78b92518b91 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ExpressionResolver.scala
@@ -40,7 +40,6 @@ import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, AggregateFunction}
import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, LogicalPlan, Sort}
import org.apache.spark.sql.catalyst.trees.CurrentOrigin
-import org.apache.spark.sql.catalyst.trees.TreeNodeTag
import org.apache.spark.sql.catalyst.util.CollationFactory
import org.apache.spark.sql.errors.QueryCompilationErrors
@@ -126,7 +125,6 @@ class ExpressionResolver(
private val aliasResolver = new AliasResolver(this)
private val timezoneAwareExpressionResolver = new TimezoneAwareExpressionResolver(this)
- private val conditionalExpressionResolver = new ConditionalExpressionResolver(this)
private val binaryArithmeticResolver = new BinaryArithmeticResolver(this)
private val limitLikeExpressionValidator = new LimitLikeExpressionValidator
private val aggregateExpressionResolver = new AggregateExpressionResolver(resolver, this)
@@ -136,11 +134,10 @@ class ExpressionResolver(
aggregateExpressionResolver,
binaryArithmeticResolver
)
- private val timeAddResolver = new TimeAddResolver(this)
- private val unaryMinusResolver = new UnaryMinusResolver(this)
private val subqueryExpressionResolver = new SubqueryExpressionResolver(this, resolver)
private val ordinalResolver = new OrdinalResolver(this)
private val lcaResolver = new LateralColumnAliasResolver(this)
+ private val semiStructuredExtractResolver = new SemiStructuredExtractResolver(this)
/**
* Get the expression tree traversal stack.
@@ -262,16 +259,16 @@ class ExpressionResolver(
subqueryExpressionResolver.resolveScalarSubquery(unresolvedScalarSubquery)
case unresolvedListQuery: ListQuery =>
subqueryExpressionResolver.resolveListQuery(unresolvedListQuery)
- case unresolvedTimeAdd: TimeAdd =>
- timeAddResolver.resolve(unresolvedTimeAdd)
+ case unresolvedTimestampAdd: TimestampAddInterval =>
+ resolveExpressionGenericallyWithTimezoneWithTypeCoercion(unresolvedTimestampAdd)
case unresolvedUnaryMinus: UnaryMinus =>
- unaryMinusResolver.resolve(unresolvedUnaryMinus)
+ resolveExpressionGenericallyWithTypeCoercion(unresolvedUnaryMinus)
case createNamedStruct: CreateNamedStruct =>
resolveExpressionGenerically(createNamedStruct)
case sortOrder: SortOrder =>
resolveExpressionGenerically(sortOrder)
case unresolvedConditionalExpression: ConditionalExpression =>
- conditionalExpressionResolver.resolve(unresolvedConditionalExpression)
+ resolveExpressionGenericallyWithTypeCoercion(unresolvedConditionalExpression)
case getViewColumnByNameAndOrdinal: GetViewColumnByNameAndOrdinal =>
resolveGetViewColumnByNameAndOrdinal(getViewColumnByNameAndOrdinal)
case getTimeField: GetTimeField =>
@@ -286,6 +283,8 @@ class ExpressionResolver(
resolveUpCast(unresolvedUpCast)
case unresolvedCollation: UnresolvedCollation =>
resolveCollation(unresolvedCollation)
+ case semiStructuredExtract: SemiStructuredExtract =>
+ semiStructuredExtractResolver.resolve(semiStructuredExtract)
case expression: Expression =>
resolveExpressionGenericallyWithTypeCoercion(expression)
}
@@ -584,15 +583,10 @@ class ExpressionResolver(
aliasResolver.resolve(unresolvedAlias)
case unresolvedAttribute: UnresolvedAttribute =>
resolveAttribute(unresolvedAttribute)
- case unresolvedStar: UnresolvedStar =>
- // We don't support edge cases of star usage, e.g. `WHERE col1 IN (*)`
- throw new ExplicitlyUnsupportedResolverFeature("Star outside of Project list")
case attributeReference: AttributeReference =>
handleResolvedAttributeReference(attributeReference)
case outerReference: OuterReference =>
handleResolvedOuterReference(outerReference)
- case _: UnresolvedNamedLambdaVariable =>
- throw new ExplicitlyUnsupportedResolverFeature("Lambda variables")
case _ =>
withPosition(unresolvedNamedExpression) {
throwUnsupportedSinglePassAnalyzerFeature(unresolvedNamedExpression)
@@ -646,6 +640,9 @@ class ExpressionResolver(
* In case that attribute is resolved as a literal function (i.e. result is [[CurrentDate]]),
* perform additional resolution on it.
*
+ * In case the result of the previous step is of a recursive data type, we coerce it to stay
+ * compatible with the fixed-point analyzer.
+ *
* If the attribute is at the top of the project list (which is indicated by
* [[ExpressionResolutionContext.isTopOfProjectList]]), we preserve the [[Alias]] or remove it
* otherwise.
@@ -667,7 +664,6 @@ class ExpressionResolver(
.resolvingGroupingExpressions && traversals.current.groupByAliases
),
canResolveNameByHiddenOutput = canResolveNameByHiddenOutput,
- shouldPreferTableColumnsOverAliases = shouldPreferTableColumnsOverAliases,
shouldPreferHiddenOutput = traversals.current.isFilterOnTopOfAggregate,
canResolveNameByHiddenOutputInSubquery =
subqueryRegistry.currentScope.aggregateExpressionsExtractor.isDefined,
@@ -689,7 +685,7 @@ class ExpressionResolver(
case Some(lateralAttributeReference) =>
scopes.current.lcaRegistry
.markAttributeLaterallyReferenced(lateralAttributeReference)
- candidate.setTagValue(ExpressionResolver.SINGLE_PASS_IS_LCA, ())
+ candidate.setTagValue(ResolverTag.SINGLE_PASS_IS_LCA, ())
expressionResolutionContext.hasLateralColumnAlias = true
case None =>
}
@@ -703,11 +699,16 @@ class ExpressionResolver(
case other => other
}
+ val coercedCandidate = candidateOrLiteralFunction match {
+ case extractValue: ExtractValue => coerceRecursiveDataTypes(extractValue)
+ case other => other
+ }
+
val properlyAliasedExpressionTree =
if (expressionResolutionContext.isTopOfProjectList && nameTarget.aliasName.isDefined) {
- Alias(candidateOrLiteralFunction, nameTarget.aliasName.get)()
+ Alias(coercedCandidate, nameTarget.aliasName.get)()
} else {
- candidateOrLiteralFunction
+ coercedCandidate
}
properlyAliasedExpressionTree match {
@@ -718,17 +719,41 @@ class ExpressionResolver(
}
}
+ /**
+ * Coerces recursive types ([[ExtractValue]] expressions) in a bottom-up manner. For example:
+ *
+ * {{{
+ * CREATE OR REPLACE TABLE t(col MAP);
+ * SELECT col.field FROM t;
+ * }}}
+ *
+ * In this example we need to cast the inner field from `String` to `BIGINT`, so the analyzed plan
+ * should look like:
+ *
+ * {{{
+ * Project [col#x[cast(field as bigint)] AS field#x]
+ * +- SubqueryAlias spark_catalog.default.t
+ * +- Relation spark_catalog.default.t[col#x] parquet
+ * }}}
+ *
+ * This is needed to stay compatible with the fixed-point implementation.
+ */
+ private def coerceRecursiveDataTypes(extractValue: ExtractValue): Expression = {
+ extractValue.transformUp {
+ case field => coerceExpressionTypes(field, traversals.current)
+ }
+ }
+
private def isFilterOnTopOfAggregate(parentOperator: LogicalPlan): Boolean = {
parentOperator match {
- case _ @Filter(_, _: Aggregate) => true
+ case _: Filter if scopes.current.baseAggregate.isDefined => true
case _ => false
}
}
private def isSortOnTopOfAggregate(parentOperator: LogicalPlan): Boolean = {
parentOperator match {
- case _ @Sort(_, _, _: Aggregate, _) => true
- case _ @Sort(_, _, _ @Filter(_, _: Aggregate), _) => true
+ case _: Sort if scopes.current.baseAggregate.isDefined => true
case _ => false
}
}
@@ -738,11 +763,6 @@ class ExpressionResolver(
case other => false
}
- private def shouldPreferTableColumnsOverAliases = traversals.current.parentOperator match {
- case _: Sort => true
- case _ => false
- }
-
/**
* [[AttributeReference]] is already resolved if it's passed to us from DataFrame `col(...)`
* function, for example.
@@ -1027,8 +1047,12 @@ class ExpressionResolver(
TypeCoercionValidation.failOnTypeCheckResult(resolvedExpression)
}
- if (!resolvedExpression.resolved) {
- throwSinglePassFailedToResolveExpression(resolvedExpression)
+ resolvedExpression match {
+ case runtimeReplaceable: RuntimeReplaceable if !runtimeReplaceable.replacement.resolved =>
+ throwFailedToResolveRuntimeReplaceableExpression(runtimeReplaceable)
+ case expression if !expression.resolved =>
+ throwSinglePassFailedToResolveExpression(resolvedExpression)
+ case _ =>
}
validateExpressionUnderSupportedOperator(resolvedExpression)
@@ -1066,10 +1090,12 @@ class ExpressionResolver(
context = expression.origin.getQueryContext,
summary = expression.origin.context.summary()
)
-}
-object ExpressionResolver {
- private val AMBIGUOUS_SELF_JOIN_METADATA = Seq("__dataset_id", "__col_position")
- val SINGLE_PASS_SUBTREE_BOUNDARY = TreeNodeTag[Unit]("single_pass_subtree_boundary")
- val SINGLE_PASS_IS_LCA = TreeNodeTag[Unit]("single_pass_is_lca")
+ private def throwFailedToResolveRuntimeReplaceableExpression(
+ runtimeReplaceable: RuntimeReplaceable) = {
+ throw SparkException.internalError(
+ s"Cannot resolve the runtime replaceable expression ${toSQLExpr(runtimeReplaceable)}. " +
+ s"The replacement is unresolved: ${toSQLExpr(runtimeReplaceable.replacement)}."
+ )
+ }
}
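The recursive-type coercion introduced above leans on Catalyst's `transformUp`, which rewrites children before parents. A minimal sketch of that traversal shape (`coerce` stands in for `coerceExpressionTypes`, which in the real code also needs the current traversal state):

    import org.apache.spark.sql.catalyst.expressions.Expression

    // Visit every node of the subtree bottom-up and let `coerce` insert any required casts
    // (e.g. casting a map key literal from STRING to BIGINT, as in the example above).
    def coerceBottomUp(root: Expression)(coerce: Expression => Expression): Expression =
      root.transformUp { case e => coerce(e) }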
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/FilterResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/FilterResolver.scala
index 599270b28b1d4..4489278f0b238 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/FilterResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/FilterResolver.scala
@@ -65,8 +65,7 @@ class FilterResolver(resolver: Resolver, expressionResolver: ExpressionResolver)
retainOriginalOutput(
operator = finalFilter,
missingExpressions = missingAttributes,
- output = scopes.current.output,
- hiddenOutput = scopes.current.hiddenOutput
+ scopes = scopes
)
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/GroupingAndAggregateExpressionsExtractor.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/GroupingAndAggregateExpressionsExtractor.scala
index e28526959f851..4929ffc57b6da 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/GroupingAndAggregateExpressionsExtractor.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/GroupingAndAggregateExpressionsExtractor.scala
@@ -33,13 +33,23 @@ import org.apache.spark.sql.catalyst.plans.logical.Aggregate
class GroupingAndAggregateExpressionsExtractor(
aggregate: Aggregate,
autoGeneratedAliasProvider: AutoGeneratedAliasProvider) {
- private val aliasChildToAliasInAggregateExpressions = new IdentityHashMap[Expression, Alias]
+
+ /**
+ * Maps children of aliases from the aggregate list to their parent aliases, or to `None` if the
+ * expression doesn't have an alias. This map only accounts for the first appearance of the
+ * expression. For example, for `SELECT col1, col1 AS a` the map entry is (col1 -> None), but for
+ * `SELECT col1 AS a, col1` the map entry is (col1 -> Some(a)).
+ */
+ private val aliasChildToAliasInAggregateExpressions =
+ new IdentityHashMap[Expression, Option[Alias]]
private val aggregateExpressionsSemanticComparator = new SemanticComparator(
aggregate.aggregateExpressions.map {
case alias: Alias =>
- aliasChildToAliasInAggregateExpressions.put(alias.child, alias)
+ aliasChildToAliasInAggregateExpressions.putIfAbsent(alias.child, Some(alias))
alias.child
- case other => other
+ case other =>
+ aliasChildToAliasInAggregateExpressions.put(other, None)
+ other
}
)
@@ -53,43 +63,48 @@ class GroupingAndAggregateExpressionsExtractor(
* (grouping expressions used for extraction) and `extractedAggregateExpressionAliases` (aliases
* of [[AggregateExpression]]s that are transformed to attributes during extraction) in order to
* insert missing attributes to below operators.
+ *
+ * When an expression exists in both grouping and aggregate expressions (for example, when there
+ * are lateral column references in [[Aggregate]], the LCA algorithm copies grouping expressions
+ * to the aggregate list prior to entering this method), we still extract the grouping expression
+ * but don't add it later if it is not necessary.
*/
def extractReferencedGroupingAndAggregateExpressions(
expression: Expression,
referencedGroupingExpressions: mutable.ArrayBuffer[NamedExpression],
extractedAggregateExpressionAliases: mutable.ArrayBuffer[Alias]): Expression = {
- collectFirstAggregateExpression(expression) match {
- case (Some(attribute: Attribute), _)
- if !aliasChildToAliasInAggregateExpressions.containsKey(attribute) =>
- attribute
- case (Some(expression), alias) =>
- alias match {
- case None =>
- throw SparkException.internalError(
- s"No parent alias for expression $expression while extracting aggregate" +
- s"expressions in Sort operator."
- )
- case Some(alias) =>
- alias.toAttribute
- }
- case (None, _) if groupingExpressionsSemanticComparator.exists(expression) =>
- expression match {
- case attribute: Attribute =>
- referencedGroupingExpressions += attribute
- attribute
- case other =>
- val alias = autoGeneratedAliasProvider.newAlias(child = other)
- referencedGroupingExpressions += alias
- alias.toAttribute
- }
- case _ =>
- expression match {
- case aggregateExpression: AggregateExpression =>
- val alias = autoGeneratedAliasProvider.newAlias(child = aggregateExpression)
- extractedAggregateExpressionAliases += alias
- alias.toAttribute
- case other => other
- }
+ val aggregateExpressionWithAlias = collectFirstAggregateExpression(expression)
+ val isGroupingExpression = groupingExpressionsSemanticComparator.exists(expression)
+ if (isGroupingExpression) {
+ val groupingExpressionReference = aggregateExpressionWithAlias match {
+ case (Some(attribute: Attribute), None) => attribute
+ case (Some(_), Some(alias)) => alias.toAttribute
+ case _ =>
+ expression match {
+ case attribute: Attribute => attribute
+ case other => autoGeneratedAliasProvider.newAlias(child = other)
+ }
+ }
+ referencedGroupingExpressions += groupingExpressionReference
+ groupingExpressionReference.toAttribute
+ } else {
+ aggregateExpressionWithAlias match {
+ case (Some(attribute: Attribute), None) => attribute
+ case (Some(_), Some(alias)) => alias.toAttribute
+ case (Some(expression), None) =>
+ throw SparkException.internalError(
+ s"No parent alias for expression $expression while extracting aggregate " +
+ s"expressions in an operator."
+ )
+ case _ =>
+ expression match {
+ case aggregateExpression: AggregateExpression =>
+ val alias = autoGeneratedAliasProvider.newAlias(child = aggregateExpression)
+ extractedAggregateExpressionAliases += alias
+ alias.toAttribute
+ case other => other
+ }
+ }
}
}
@@ -103,7 +118,7 @@ class GroupingAndAggregateExpressionsExtractor(
aggregateExpressionsSemanticComparator.collectFirst(expression)
referencedAggregateExpression match {
case Some(expression) =>
- (Some(expression), Option(aliasChildToAliasInAggregateExpressions.get(expression)))
+ (Some(expression), aliasChildToAliasInAggregateExpressions.get(expression))
case None =>
(None, None)
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HavingResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HavingResolver.scala
index 4bbcd43a0377a..ec0907807d5d0 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HavingResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HavingResolver.scala
@@ -22,13 +22,14 @@ import scala.collection.mutable
import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.analysis.UnresolvedHaving
import org.apache.spark.sql.catalyst.expressions.{Alias, Expression, NamedExpression}
-import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, LogicalPlan}
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, LogicalPlan, Project}
/**
* Resolves [[UnresolvedHaving]] node and its condition.
*/
class HavingResolver(resolver: Resolver, expressionResolver: ExpressionResolver)
extends TreeNodeResolver[UnresolvedHaving, LogicalPlan]
+ with RewritesAliasesInTopLcaProject
with ResolvesNameByHiddenOutput
with ValidatesFilter {
private val scopes: NameScopeStack = resolver.getNameScopes
@@ -53,29 +54,48 @@ class HavingResolver(resolver: Resolver, expressionResolver: ExpressionResolver)
val partiallyResolvedHaving =
Filter(condition = unresolvedHaving.havingCondition, child = resolvedChild)
- val resolvedCondition = expressionResolver.resolveExpressionTreeInOperator(
+ val partiallyResolvedCondition = expressionResolver.resolveExpressionTreeInOperator(
partiallyResolvedHaving.condition,
partiallyResolvedHaving
)
- val (finalCondition, missingExpressions) = resolvedChild match {
- case _ if scopes.current.hasLcaInAggregate =>
- throw new ExplicitlyUnsupportedResolverFeature(
- "Lateral column alias in Aggregate below HAVING"
+ val (resolvedCondition, missingExpressions) = resolvedChild match {
+ case _ @(_: Project | _: Aggregate) if scopes.current.baseAggregate.isDefined =>
+ handleAggregateBelowHaving(
+ scopes.current.baseAggregate.get,
+ partiallyResolvedCondition
)
- case aggregate: Aggregate =>
- handleAggregateBelowHaving(aggregate, resolvedCondition)
case other =>
throw SparkException.internalError(
s"Unexpected operator ${other.getClass.getSimpleName} under HAVING"
)
}
+ val (resolvedConditionWithAliasReplacement, filteredMissingExpressions) =
+ tryReplaceSortOrderOrHavingConditionWithAlias(resolvedCondition, scopes, missingExpressions)
+
+ val deduplicatedMissingExpressions = deduplicateMissingExpressions(filteredMissingExpressions)
+
val resolvedChildWithMissingAttributes =
- insertMissingExpressions(resolvedChild, missingExpressions.toSeq)
+ insertMissingExpressions(resolvedChild, deduplicatedMissingExpressions)
+
+ val isChildChangedByMissingExpressions = !resolvedChildWithMissingAttributes.eq(resolvedChild)
+
+ val (finalChild, finalCondition) = resolvedChildWithMissingAttributes match {
+ case project: Project if scopes.current.baseAggregate.isDefined =>
+ val (newProject, newExpressions) = rewriteNamedExpressionsInTopLcaProject(
+ projectToRewrite = project,
+ baseAggregate = scopes.current.baseAggregate.get,
+ expressionsToRewrite = Seq(resolvedConditionWithAliasReplacement),
+ rewriteCandidates = missingExpressions,
+ autoGeneratedAliasProvider = autoGeneratedAliasProvider
+ )
+ (newProject, newExpressions.head)
+ case other => (other, resolvedCondition)
+ }
val resolvedHaving = partiallyResolvedHaving.copy(
- child = resolvedChildWithMissingAttributes,
+ child = finalChild,
condition = finalCondition
)
@@ -85,12 +105,15 @@ class HavingResolver(resolver: Resolver, expressionResolver: ExpressionResolver)
resolvedFilter = resolvedHaving
)
- retainOriginalOutput(
- operator = resolvedHaving,
- missingExpressions = missingExpressions.toSeq,
- output = scopes.current.output,
- hiddenOutput = scopes.current.hiddenOutput
- )
+ if (isChildChangedByMissingExpressions) {
+ retainOriginalOutput(
+ operator = resolvedHaving,
+ missingExpressions = missingExpressions.toSeq,
+ scopes = scopes
+ )
+ } else {
+ resolvedHaving
+ }
}
/**
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HybridAnalyzer.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HybridAnalyzer.scala
index c21d1aacadeaf..0117b3fc2fb55 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HybridAnalyzer.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/HybridAnalyzer.scala
@@ -75,21 +75,17 @@ class HybridAnalyzer(
private val sampleRateGenerator = new Random()
def apply(plan: LogicalPlan, tracker: QueryPlanningTracker): LogicalPlan = {
- val passedResolvedGuard = resolverGuard.apply(plan)
-
val dualRun =
conf.getConf(SQLConf.ANALYZER_DUAL_RUN_LEGACY_AND_SINGLE_PASS_RESOLVER) &&
- passedResolvedGuard &&
- checkDualRunSampleRate()
+ checkDualRunSampleRate() &&
+ checkResolverGuard(plan)
withTrackedAnalyzerBridgeState(dualRun) {
if (dualRun) {
resolveInDualRun(plan, tracker)
} else if (conf.getConf(SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_ENABLED)) {
resolveInSinglePass(plan, tracker)
- } else if (passedResolvedGuard && conf.getConf(
- SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_ENABLED_TENTATIVELY
- )) {
+ } else if (conf.getConf(SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_ENABLED_TENTATIVELY)) {
resolveInSinglePassTentatively(plan, tracker)
} else {
resolveInFixedPoint(plan, tracker)
@@ -97,10 +93,6 @@ class HybridAnalyzer(
}
}
- def getSinglePassResolutionDuration: Option[Long] = singlePassResolutionDuration
-
- def getFixedPointResolutionDuration: Option[Long] = fixedPointResolutionDuration
-
/**
* Call `body` in the context of tracked [[AnalyzerBridgeState]]. Set the new bridge state
* depending on whether we are in dual-run mode or not:
@@ -206,10 +198,21 @@ class HybridAnalyzer(
private def resolveInSinglePassTentatively(
plan: LogicalPlan,
tracker: QueryPlanningTracker): LogicalPlan = {
- try {
- resolveInSinglePass(plan, tracker)
- } catch {
- case _: ExplicitlyUnsupportedResolverFeature =>
+ val singlePassResult = if (checkResolverGuard(plan)) {
+ try {
+ Some(resolveInSinglePass(plan, tracker))
+ } catch {
+ case _: ExplicitlyUnsupportedResolverFeature =>
+ None
+ }
+ } else {
+ None
+ }
+
+ singlePassResult match {
+ case Some(result) =>
+ result
+ case None =>
resolveInFixedPoint(plan, tracker)
}
}
@@ -256,6 +259,16 @@ class HybridAnalyzer(
}
}
+ private def checkResolverGuard(plan: LogicalPlan): Boolean = {
+ try {
+ resolverGuard.apply(plan)
+ } catch {
+ case e: Throwable
+ if !conf.getConf(SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_EXPOSE_RESOLVER_GUARD_FAILURE) =>
+ false
+ }
+ }
+
/**
* Normalizes the logical plan using [[NormalizePlan]].
*
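The reworked `resolveInSinglePassTentatively` above follows a simple shape: check the guard, try the single-pass path, and fall back to fixed-point both when the guard fails and when the single-pass path bails out. A hedged sketch of that control flow, with a generic exception standing in for `ExplicitlyUnsupportedResolverFeature`:

    // Run the experimental path only if the guard passed; otherwise, or on a recoverable
    // failure, fall back to the legacy path.
    def tentatively[A](guardPassed: Boolean)(experimental: => A)(legacy: => A): A = {
      val attempted =
        if (guardPassed) {
          try Some(experimental)
          catch { case _: UnsupportedOperationException => None } // placeholder exception type
        } else {
          None
        }
      attempted.getOrElse(legacy)
    }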
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/JoinResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/JoinResolver.scala
index ff752bd76f41e..c718a8ba3782c 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/JoinResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/JoinResolver.scala
@@ -208,7 +208,7 @@ class JoinResolver(resolver: Resolver, expressionResolver: ExpressionResolver)
scopes.current.hiddenOutput.filter(_.qualifiedAccessOnly)
val newProjectList =
- if (unresolvedJoin.getTagValue(Resolver.TOP_LEVEL_OPERATOR).isEmpty) {
+ if (unresolvedJoin.getTagValue(ResolverTag.TOP_LEVEL_OPERATOR).isEmpty) {
newOutputList ++ qualifiedAccessOnlyColumnsFromHiddenOutput
} else {
newOutputList
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/KeyTransformingMap.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/KeyTransformingMap.scala
index ae56c6ed04193..7815b3b0c79cd 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/KeyTransformingMap.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/KeyTransformingMap.scala
@@ -17,16 +17,17 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import java.util.{Collection, HashMap, Iterator}
+import java.util.{Collection, Iterator, LinkedHashMap}
import java.util.Map.Entry
import java.util.function.Function
/**
* The [[KeyTransformingMap]] is a partial implementation of [[mutable.Map]] that transforms input
* keys with a custom [[mapKey]] method.
+ * It preserves the order of insertion by using the [[LinkedHashMap]] as an underlying map.
*/
private abstract class KeyTransformingMap[K, V] {
- private val impl = new HashMap[K, V]
+ private val impl = new LinkedHashMap[K, V]
def get(key: K): Option[V] = Option(impl.get(mapKey(key)))
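The `HashMap` to `LinkedHashMap` switch above only changes iteration order, but that is exactly what the resolver now relies on. A quick self-contained illustration with plain `java.util` types:

    import java.util.{LinkedHashMap => JLinkedHashMap}

    val m = new JLinkedHashMap[String, Int]()
    m.put("b", 2)
    m.put("a", 1)
    // Iteration follows insertion order: "b" then "a". A plain java.util.HashMap
    // gives no such guarantee.
    m.forEach((k: String, v: Int) => println(s"$k -> $v"))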
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasProhibitedRegistry.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasProhibitedRegistry.scala
index bc0f11f5bd6de..e6e084115adec 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasProhibitedRegistry.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasProhibitedRegistry.scala
@@ -28,7 +28,7 @@ import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute}
* idempotent.
*/
class LateralColumnAliasProhibitedRegistry extends LateralColumnAliasRegistry {
- def withNewLcaScope(body: => Alias): Alias = body
+ def withNewLcaScope(isTopLevelAlias: Boolean)(body: => Alias): Alias = body
def getAttribute(attributeName: String): Option[Attribute] =
throwLcaResolutionNotEnabled()
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistry.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistry.scala
index 45a38417a8eed..fa539a4d9110f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistry.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistry.scala
@@ -30,7 +30,7 @@ import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute}
* LCA resolution is disabled by [[SQLConf.LATERAL_COLUMN_ALIAS_IMPLICIT_ENABLED]].
*/
abstract class LateralColumnAliasRegistry {
- def withNewLcaScope(body: => Alias): Alias
+ def withNewLcaScope(isTopLevelAlias: Boolean)(body: => Alias): Alias
def getAttribute(attributeName: String): Option[Attribute]
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistryImpl.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistryImpl.scala
index c685b098db2d2..94520455ee8d3 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistryImpl.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasRegistryImpl.scala
@@ -81,13 +81,15 @@ class LateralColumnAliasRegistryImpl(attributes: Seq[Attribute])
/**
* Creates a new LCA resolution scope for each [[Alias]] resolution. Executes the lambda and
- * registers the resolved alias for later LCA resolution.
+ * registers top-level resolved aliases for later LCA resolution.
*/
- def withNewLcaScope(body: => Alias): Alias = {
+ def withNewLcaScope(isTopLevelAlias: Boolean)(body: => Alias): Alias = {
currentAttributeDependencyLevelStack.push(0)
try {
val resolvedAlias = body
- registerAlias(resolvedAlias)
+ if (isTopLevelAlias) {
+ registerAlias(resolvedAlias)
+ }
resolvedAlias
} finally {
currentAttributeDependencyLevelStack.pop()
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasResolver.scala
index 1ffaf73fc356a..5d268f087aa92 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LateralColumnAliasResolver.scala
@@ -57,9 +57,13 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
* - In order to be able to resolve [[Sort]] on top of an [[Aggregate]] that has LCAs, we need
* to collect all aliases from [[Aggregate]], as well as any aliases from artificially inserted
* [[Project]] nodes.
+ * - Collects all aliases from newly created [[Aggregate]] and [[Project]] nodes and adds them
+ * to `aliasesToCollect`.
*/
def handleLcaInAggregate(resolvedAggregate: Aggregate): AggregateWithLcaResolutionResult = {
- extractLcaAndReplaceAggWithProject(resolvedAggregate) match {
+ val aliasesToCollect = new ArrayBuffer[Alias]
+
+ extractLcaAndReplaceAggWithProject(resolvedAggregate, aliasesToCollect) match {
case _ @Project(projectList: Seq[_], aggregate: Aggregate) =>
// TODO: This validation function does a post-traversal. This is discouraged in single-pass
// Analyzer.
@@ -76,21 +80,17 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
scope = scopes.current,
originalProjectList = projectList,
firstIterationProjectList = aggregate.aggregateExpressions.map(_.toAttribute),
- remappedAliases = Some(remappedAliases)
+ remappedAliases = Some(remappedAliases),
+ aliasesToCollect = aliasesToCollect
)
- val aggregateListAliases =
- scopes.current.lcaRegistry.getAliasDependencyLevels().asScala.flatMap(_.asScala).toSeq
-
- scopes.overwriteCurrent(
- output = Some(finalProject.projectList.map(_.toAttribute)),
- hasLcaInAggregate = true
- )
+ scopes.overwriteCurrent(output = Some(finalProject.projectList.map(_.toAttribute)))
AggregateWithLcaResolutionResult(
resolvedOperator = finalProject,
outputList = finalProject.projectList,
- aggregateListAliases = aggregateListAliases
+ aggregateListAliases = aliasesToCollect.toSeq,
+ baseAggregate = aggregate
)
case _ =>
throw SparkException.internalError(
@@ -128,6 +128,8 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
* full definitions ( `attr` as `name` ) have already been defined on lower levels.
* - If an attribute is never referenced, it does not show up in multi-level project lists, but
* instead only in the top-most [[Project]].
+ * - Additionally, collect all aliases from newly created [[Project]] nodes and add them to
+ * `aliasesToCollect`.
*
* For previously given query, following above rules, resolved [[Project]] would look like:
*
@@ -142,7 +144,8 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
scope: NameScope,
originalProjectList: Seq[NamedExpression],
firstIterationProjectList: Seq[NamedExpression],
- remappedAliases: Option[HashMap[ExprId, Alias]] = None): Project = {
+ remappedAliases: Option[HashMap[ExprId, Alias]] = None,
+ aliasesToCollect: ArrayBuffer[Alias] = ArrayBuffer.empty): Project = {
val aliasDependencyMap = scope.lcaRegistry.getAliasDependencyLevels()
val (finalChildPlan, _) = aliasDependencyMap.asScala.foldLeft(
(resolvedChild, firstIterationProjectList)
@@ -159,6 +162,12 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
if (referencedAliases.nonEmpty) {
val newProjectList = currentProjectList.map(_.toAttribute) ++ referencedAliases
+
+ newProjectList.foreach {
+ case alias: Alias => aliasesToCollect += alias
+ case _ =>
+ }
+
(Project(newProjectList, currentPlan), newProjectList)
} else {
(currentPlan, currentProjectList)
@@ -173,6 +182,11 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
}
}
+ finalProjectList.foreach {
+ case alias: Alias => aliasesToCollect += alias
+ case _ =>
+ }
+
Project(finalProjectList, finalChildPlan)
}
@@ -184,6 +198,8 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
* [[NamedExpression]] we don't need to alias it again.
* - Places a [[Project]] on top of the new [[Aggregate]] operator, where the project list will
* be created from [[Alias]] references to original aggregate expressions.
+ * - Additionally, collect aliases from newly created aggregate expressions and add them to
+ * `aliasesToCollect`.
*
* For example, for a query like:
*
@@ -198,7 +214,9 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
* The [[Project]] is unresolved, which is fine, because it will later be resolved as if we only
* had a lateral alias reference in [[Project]] and not [[Aggregate]].
*/
- private def extractLcaAndReplaceAggWithProject(aggregate: Aggregate): Project = {
+ private def extractLcaAndReplaceAggWithProject(
+ aggregate: Aggregate,
+ aliasesToCollect: ArrayBuffer[Alias]): Project = {
val newAggregateExpressions = new LinkedHashSet[NamedExpression]
val extractedExpressionAliases = new HashMap[Expression, NamedExpression]()
val groupingExpressionSemanticComparator = new SemanticComparator(aggregate.groupingExpressions)
@@ -212,9 +230,16 @@ class LateralColumnAliasResolver(expressionResolver: ExpressionResolver) extends
newAggregateExpressions = newAggregateExpressions
).asInstanceOf[NamedExpression]
)
+
+ val newAggregateExpressionsSeq = newAggregateExpressions.asScala.toSeq
+ newAggregateExpressionsSeq.foreach {
+ case alias: Alias => aliasesToCollect += alias
+ case _ =>
+ }
+
val result = Project(
projectList = extractedExpressions,
- child = aggregate.copy(aggregateExpressions = newAggregateExpressions.asScala.toSeq)
+ child = aggregate.copy(aggregateExpressions = newAggregateExpressionsSeq)
)
result
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LimitExpressionResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LimitExpressionResolver.scala
deleted file mode 100644
index d25112d78c6e7..0000000000000
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/LimitExpressionResolver.scala
+++ /dev/null
@@ -1,110 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.spark.sql.catalyst.analysis.resolver
-
-import org.apache.spark.sql.AnalysisException
-import org.apache.spark.sql.catalyst.expressions.Expression
-import org.apache.spark.sql.types.IntegerType
-
-/**
- * The [[LimitExpressionResolver]] is a resolver that resolves a [[LocalLimit]] or [[GlobalLimit]]
- * expression and performs all the necessary validation.
- */
-class LimitExpressionResolver extends TreeNodeResolver[Expression, Expression] {
-
- /**
- * Resolve a limit expression of [[GlobalLimit]] or [[LocalLimit]] and perform validation.
- */
- override def resolve(unresolvedLimitExpression: Expression): Expression = {
- validateLimitExpression(unresolvedLimitExpression, expressionName = "limit")
- unresolvedLimitExpression
- }
-
- /**
- * Validate a resolved limit expression of [[GlobalLimit]] or [[LocalLimit]]:
- * - The expression has to be foldable
- * - The result data type has to be [[IntegerType]]
- * - The evaluated expression has to be non-null
- * - The evaluated expression has to be positive
- *
- * The `foldable` check is implemented in some expressions
- * as a recursive expression tree traversal.
- * It is not an ideal approach for the single-pass [[ExpressionResolver]],
- * but __is__ practical, since:
- * - We have to call `eval` here anyway, and it's recursive
- * - In practice `LIMIT` expression trees are very small
- */
- private def validateLimitExpression(expression: Expression, expressionName: String): Unit = {
- if (!expression.foldable) {
- throwInvalidLimitLikeExpressionIsUnfoldable(expressionName, expression)
- }
- if (expression.dataType != IntegerType) {
- throwInvalidLimitLikeExpressionDataType(expressionName, expression)
- }
- expression.eval() match {
- case null =>
- throwInvalidLimitLikeExpressionIsNull(expressionName, expression)
- case value: Int if value < 0 =>
- throwInvalidLimitLikeExpressionIsNegative(expressionName, expression, value)
- case _ =>
- }
- }
-
- private def throwInvalidLimitLikeExpressionIsUnfoldable(
- name: String,
- expression: Expression): Nothing =
- throw new AnalysisException(
- errorClass = "INVALID_LIMIT_LIKE_EXPRESSION.IS_UNFOLDABLE",
- messageParameters = Map(
- "name" -> name,
- "expr" -> toSQLExpr(expression)
- ),
- origin = expression.origin
- )
-
- private def throwInvalidLimitLikeExpressionDataType(
- name: String,
- expression: Expression): Nothing =
- throw new AnalysisException(
- errorClass = "INVALID_LIMIT_LIKE_EXPRESSION.DATA_TYPE",
- messageParameters = Map(
- "name" -> name,
- "expr" -> toSQLExpr(expression),
- "dataType" -> toSQLType(expression.dataType)
- ),
- origin = expression.origin
- )
-
- private def throwInvalidLimitLikeExpressionIsNull(name: String, expression: Expression): Nothing =
- throw new AnalysisException(
- errorClass = "INVALID_LIMIT_LIKE_EXPRESSION.IS_NULL",
- messageParameters = Map("name" -> name, "expr" -> toSQLExpr(expression)),
- origin = expression.origin
- )
-
- private def throwInvalidLimitLikeExpressionIsNegative(
- name: String,
- expression: Expression,
- value: Int): Nothing =
- throw new AnalysisException(
- errorClass = "INVALID_LIMIT_LIKE_EXPRESSION.IS_NEGATIVE",
- messageParameters =
- Map("name" -> name, "expr" -> toSQLExpr(expression), "v" -> toSQLValue(value, IntegerType)),
- origin = expression.origin
- )
-}
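
The removed resolver's documentation spells out four validation rules for a LIMIT expression. A condensed sketch of those rules as a single predicate is shown below; the real code throws dedicated error classes instead of returning a Boolean, and the object name is hypothetical.

```scala
import org.apache.spark.sql.catalyst.expressions.{Expression, Literal}
import org.apache.spark.sql.types.IntegerType

// The four checks: foldable, IntegerType result, non-null value, non-negative value.
object LimitValidationSketch {
  def isValidLimit(expression: Expression): Boolean =
    expression.foldable &&
      expression.dataType == IntegerType &&
      (expression.eval() match {
        case null       => false
        case value: Int => value >= 0
        case _          => false
      })

  def main(args: Array[String]): Unit = {
    assert(isValidLimit(Literal(10)))
    assert(!isValidLimit(Literal(-1)))   // negative
    assert(!isValidLimit(Literal("10"))) // not an IntegerType
  }
}
```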
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/MetadataResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/MetadataResolver.scala
index bccc038f87eff..12ca6b4b333d6 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/MetadataResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/MetadataResolver.scala
@@ -17,17 +17,9 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import org.apache.spark.sql.catalyst.analysis.{
- FunctionResolution,
- RelationResolution,
- UnresolvedRelation
-}
-import org.apache.spark.sql.catalyst.plans.logical.{
- AnalysisHelper,
- LogicalPlan,
- SubqueryAlias,
- UnresolvedWith
-}
+import org.apache.spark.sql.catalyst.SQLConfHelper
+import org.apache.spark.sql.catalyst.analysis.{RelationResolution, UnresolvedRelation}
+import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.trees.TreePattern.{UNRESOLVED_RELATION, UNRESOLVED_WITH}
import org.apache.spark.sql.connector.catalog.CatalogManager
@@ -45,9 +37,9 @@ import org.apache.spark.sql.connector.catalog.CatalogManager
class MetadataResolver(
override val catalogManager: CatalogManager,
override val relationResolution: RelationResolution,
- functionResolution: FunctionResolution,
override val extensions: Seq[ResolverExtension] = Seq.empty)
- extends RelationMetadataProvider
+ extends SQLConfHelper
+ with RelationMetadataProvider
with DelegatesResolutionToExtensions {
override val relationsWithResolvedMetadata = new RelationsWithResolvedMetadata
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/NameScope.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/NameScope.scala
index aed5b767b2066..3ccae116cb187 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/NameScope.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/NameScope.scala
@@ -38,6 +38,7 @@ import org.apache.spark.sql.catalyst.expressions.{
NamedExpression,
OuterReference
}
+import org.apache.spark.sql.catalyst.plans.logical.Aggregate
import org.apache.spark.sql.catalyst.util._
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.Metadata
@@ -141,8 +142,9 @@ import org.apache.spark.sql.types.Metadata
* to this [[NameScope]]. If the [[Aggregate]] has lateral column references, this list contains
* both the aliases from [[Aggregate]] as well as all aliases from artificially inserted
* [[Project]] nodes.
- * @param hasLcaInAggregate Flag that indicates whether there is a lateral column alias reference
- * in the [[Aggregate]] corresponding to this [[NameScope]].
+ * @param baseAggregate [[Aggregate]] node that is either a resolved [[Aggregate]] corresponding to
+ * this node or a base [[Aggregate]] constructed when resolving lateral column references in
+ * [[Aggregate]].
*/
class NameScope(
val output: Seq[Attribute] = Seq.empty,
@@ -150,7 +152,7 @@ class NameScope(
val isSubqueryRoot: Boolean = false,
val availableAliases: HashSet[ExprId] = new HashSet[ExprId],
val aggregateListAliases: Seq[Alias] = Seq.empty,
- val hasLcaInAggregate: Boolean = false,
+ val baseAggregate: Option[Aggregate] = None,
planLogger: PlanLogger = new PlanLogger
) extends SQLConfHelper {
@@ -223,21 +225,21 @@ class NameScope(
/**
* Returns new [[NameScope]] which preserves all the immutable [[NameScope]] properties but
* overwrites `output`, `hiddenOutput`, `availableAliases`, `aggregateListAliases` and
- * `hasLcaInAggregate` if provided. Mutable state like `lcaRegistry` is not preserved.
+ * `baseAggregate` if provided. Mutable state like `lcaRegistry` is not preserved.
*/
def overwrite(
output: Option[Seq[Attribute]] = None,
hiddenOutput: Option[Seq[Attribute]] = None,
availableAliases: Option[HashSet[ExprId]] = None,
aggregateListAliases: Seq[Alias] = Seq.empty,
- hasLcaInAggregate: Boolean = false): NameScope = {
+ baseAggregate: Option[Aggregate] = None): NameScope = {
new NameScope(
output = output.getOrElse(this.output),
hiddenOutput = hiddenOutput.getOrElse(this.hiddenOutput),
isSubqueryRoot = isSubqueryRoot,
availableAliases = availableAliases.getOrElse(this.availableAliases),
aggregateListAliases = aggregateListAliases,
- hasLcaInAggregate = hasLcaInAggregate || this.hasLcaInAggregate,
+ baseAggregate = baseAggregate,
planLogger = planLogger
)
}
@@ -300,6 +302,26 @@ class NameScope(
def getOrdinalReplacementExpressions: Option[OrdinalReplacementExpressions] =
ordinalReplacementExpressions
+ /**
+ * Returns attribute with `expressionId` if `output` contains it. This is used to preserve
+ * nullability for resolved [[AttributeReference]].
+ */
+ def getAttributeById(expressionId: ExprId): Option[Attribute] =
+ Option(outputById.get(expressionId))
+
+ /**
+ * Returns attribute with `expressionId` if `hiddenOutput` contains it.
+ */
+ def getHiddenAttributeById(expressionId: ExprId): Option[Attribute] =
+ Option(hiddenAttributesById.get(expressionId))
+
+ /**
+ * Returns all the explicitly output expression IDs. Hidden and metadata output are not included.
+ */
+ def getOutputIds: Set[ExprId] = {
+ output.map(_.exprId).toSet
+ }
+
/**
* Expand the [[UnresolvedStar]]. The expected use case for this method is star expansion inside
* [[Project]].
@@ -351,6 +373,28 @@ class NameScope(
)
}
+ /**
+ * Find attributes in this [[NameScope]] that match a provided one-part `name`.
+ *
+ * This method is simpler and more lightweight than [[resolveMultipartName]], because here we
+ * just return all the attributes matched by the one-part `name`. This is only suitable
+ * for situations where name _resolution_ is not required (e.g. accessing struct fields
+ * from the lower operator's output).
+ *
+ * For example, this method is used to look up attributes to match a specific [[View]] schema.
+ * See [[ExpressionResolver.resolveGetViewColumnByNameAndOrdinal]] for more info on view column
+ * lookup.
+ *
+ * We are relying on a simple [[IdentifierMap]] to perform that work, since we just need to match
+ * one-part name from the lower operator's output here.
+ */
+ def findAttributesByName(name: String): Seq[Attribute] = {
+ attributesByName.get(name) match {
+ case Some(attributes) => attributes.toSeq
+ case None => Seq.empty
+ }
+ }
+
/**
* Resolve multipart name into a [[NameTarget]]. [[NameTarget]]'s `candidates` may contain
* simple [[AttributeReference]]s if it's a column or alias, or [[ExtractValue]] expressions if
@@ -445,19 +489,6 @@ class NameScope(
* Even though there is ambiguity with the name `col1`, the [[SortOrder]] expression should be
* resolved as a table column from the project list and not throw [[AMBIGUOUS_REFERENCE]].
*
- * On the other hand, in the following example:
- *
- * {{{
- * val df = sql("SELECT 1 AS col1, col1 FROM VALUES(1)")
- * df.select("col1")
- * }}}
- *
- * Resolution of name `col1` in the second [[Project]] produce [[AMBIGUOUS_REFERENCE]] error.
- *
- * In order to achieve this we are using [[shouldPreferTableColumnsOverAliases]] flag which
- * should be set to true when the parent operator is [[Sort]] and only when we are resolving by
- * `output` (we don't consider this flag for `metadataOutput` or `hiddenOutput`).
- *
* The names in [[Aggregate.groupingExpressions]] can reference
* [[Aggregate.aggregateExpressions]] aliases. `canReferenceAggregateExpressionAliases` will be
* true when we are resolving the grouping expressions.
@@ -484,17 +515,35 @@ class NameScope(
* SELECT COUNT(col1) FROM t1 GROUP BY col1 ORDER BY MAX(col2);
* }}}
*
- * We are relying on the [[AttributeSeq]] to perform that work, since it requires complex
- * resolution logic involving nested field extraction and multipart name matching.
+ * Spark is being smart about name resolution and prioritizes candidates from output levels that
+ * can actually be resolved, even though that output level might not be the first choice.
+ * For example, ORDER BY clause prefers attributes from SELECT list (namely, aliases) over table
+ * columns from below. However, if attributes on the SELECT level have name ambiguity or other
+ * issues, Spark will try to resolve the name using the table columns from below. Examples:
+ *
+ * {{{
+ * CREATE TABLE t1 (col1 INT);
+ * CREATE TABLE t2 (col1 STRUCT);
+ *
+ * -- Main output is ambiguous, so col1 from t1 is used for sorting.
+ * SELECT 1 AS col1, 2 AS col1 FROM t1 ORDER BY col1;
+ *
+ * -- col1 from main output does not have `field`, so struct field of col1 from t2 is used for
+ * -- sorting.
+ * SELECT 1 AS col1 FROM t2 ORDER BY col1.field;
+ * }}}
+ *
+ * This is achieved using candidate prioritization mechanism in [[pickSuitableCandidates]].
*
- * Also, see [[AttributeSeq.resolve]] for more details.
+ * We are relying on the [[AttributeSeq]] to perform name resolution, since it requires complex
+ * resolution logic involving nested field extraction and multipart name matching. See
+ * [[AttributeSeq.resolve]] for more details.
*/
def resolveMultipartName(
multipartName: Seq[String],
canLaterallyReferenceColumn: Boolean = false,
canReferenceAggregateExpressionAliases: Boolean = false,
canResolveNameByHiddenOutput: Boolean = false,
- shouldPreferTableColumnsOverAliases: Boolean = false,
shouldPreferHiddenOutput: Boolean = false,
canReferenceAggregatedAccessOnlyAttributes: Boolean = false): NameTarget = {
val resolvedMultipartName: ResolvedMultipartName =
@@ -502,7 +551,6 @@ class NameScope(
multipartName = multipartName,
nameComparator = nameComparator,
canResolveNameByHiddenOutput = canResolveNameByHiddenOutput,
- shouldPreferTableColumnsOverAliases = shouldPreferTableColumnsOverAliases,
shouldPreferHiddenOutput = shouldPreferHiddenOutput,
canReferenceAggregatedAccessOnlyAttributes = canReferenceAggregatedAccessOnlyAttributes
).orElse(tryResolveMultipartNameAsLiteralFunction(multipartName))
@@ -536,149 +584,104 @@ class NameScope(
}
/**
- * Find attributes in this [[NameScope]] that match a provided one-part `name`.
- *
- * This method is simpler and more lightweight than [[resolveMultipartName]], because here we
- * just return all the attributes matched by the one-part `name`. This is only suitable
- * for situations where name _resolution_ is not required (e.g. accessing struct fields
- * from the lower operator's output).
- *
- * For example, this method is used to look up attributes to match a specific [[View]] schema.
- * See [[ExpressionResolver.resolveGetViewColumnByNameAndOrdinal]] for more info on view column
- * lookup.
- *
- * We are relying on a simple [[IdentifierMap]] to perform that work, since we just need to match
- * one-part name from the lower operator's output here.
- */
- def findAttributesByName(name: String): Seq[Attribute] = {
- attributesByName.get(name) match {
- case Some(attributes) => attributes.toSeq
- case None => Seq.empty
- }
- }
-
- /**
- * Returns attribute with `expressionId` if `output` contains it. This is used to preserve
- * nullability for resolved [[AttributeReference]].
- */
- def getAttributeById(expressionId: ExprId): Option[Attribute] =
- Option(outputById.get(expressionId))
-
- /**
- * Returns attribute with `expressionId` if `hiddenOutput` contains it.
- */
- def getHiddenAttributeById(expressionId: ExprId): Option[Attribute] =
- Option(hiddenAttributesById.get(expressionId))
-
- /**
- * Return all the explicitly outputted expression IDs. Hidden or metadata output are not included.
- */
- def getOutputIds: Set[ExprId] = {
- output.map(_.exprId).toSet
- }
-
- /**
- * Resolution by attributes available in the current [[NameScope]] is done in the following way:
- * - First, we resolve the name using all the available attributes in the current scope
- * - For all the candidates that are found, we lookup the expression IDs in the maps created
- * when [[NameScope]] is updated to distinguish attributes resolved using the main output,
- * hidden output and metadata output (for hidden output, we use
- * `canReferenceAggregatedAccessOnlyAttributes` flag to determine if all the attributes can be
- * used or only the ones that are not tagged as `aggregatedAccessOnly`).
- * - We prioritize the hidden output over the other ones if `shouldPreferHiddenOutput` is set to
- * true. This is done in case of HAVING where attributes from grouping expressions of the
- * underlying [[Aggregate]] are preferred over aliases from operator below. Example:
- *
- * {{{ SELECT 1 AS col1 FROM VALUES(1, 2) GROUP BY col1 HAVING col1 = 1; }}}
- *
- * Plan would be:
- * Project [col1#2]
- * +- Filter (col1#1 = 1)
- * +- Aggregate [col1#1], [a AS col1#2, col1#1]
- * +- LocalRelation [col1#1, col2#3]
- *
- * Otherwise, we prioritize main output over the metadata output and metadata output
- * over the hidden output.
- * - If `shouldPreferTableColumnsOverAliases` is set to true, we prefer the table columns over
- * the aliases which can be used for name resolution.
- * - If we didn't find any candidates this way we fallback to other ways of resolution described
- * in `resolveMultipartName` doc.
+ * Try to resolve [[multipartName]] using attributes from a relevant operator output. This algorithm
+ * splits candidates from [[attributesForResolution]] into several groups and picks the best match
+ * ensuring that there's no choice ambiguity.
+ *
+ * Detailed flow:
+ * 1. Match the given [[multipartName]] using
+ * [[attributesForResolution.getCandidatesForResolution]] and get a subset of candidates for
+ * that name.
+ * 2. If nested fields were inferred during the name matching process, we are dealing with
+ * struct/map/array field/element extraction. Further narrow down those attributes that are
+ * suitable for field extraction using [[ExtractValue.isExtractable]]. We can safely do this
+ * right away, because nested fields cannot be applied to non-recursive data types.
+ * 3. Triage the candidates into several groups: main output, metadata output and hidden output.
+ * Main output is the topmost output of a relevant operator (actual SELECT list). Metadata
+ * output is a special qualified-access only output which originates from [[NaturalJoin]] or
+ * [[UsingJoin]] and can only be accessed by a qualified multipart name. If we have it, it
+ * means that [[attributesForResolution.getCandidatesForResolution]] inferred a qualified
+ * attribute name. Hidden output is only used if [[canResolveNameByHiddenOutput]] is specified
+ * (in ORDER BY and HAVING clauses). These attributes can sometimes be accessed from below in
+ * relation to the relevant operator - the attributes are not explicitly mentioned in a SELECT
+ * clause, but SQL language rules still allow referencing them. Not all hidden attributes can
+ * be referenced if we are dealing with an [[Aggregate]] - only those that are part of grouping
+ * expressions, or if we are resolving a name under an aggregate function (if
+ * [[canReferenceAggregatedAccessOnlyAttributes]] is specified).
+ * 4. Infer the right resolution priority depending on [[canResolveNameByHiddenOutput]] and
+ * [[shouldPreferHiddenOutput]] flag values. These flags are set depending on the operator
+ * in which context we are currently resolving the [[multipartName]]. For example, ORDER BY
+ * clause prefers attributes from SELECT list over lower attributes from the table, but HAVING
+ * clause has the opposite rules.
+ * 5. Pick the best suitable candidates using [[pickSuitableCandidates]]. We prioritize candidates
+ * that have exactly 1 match for the [[multipartName]], because other options would fail.
+ * If there was a single match, we return [[ResolvedMultipartName]] with that attribute, and
+ * multipart name resolution process succeeds. If none of the options are suitable, we fall
+ * back to the main output and either return [[ResolvedMultipartName]] with multiple candidates
+ * from that main output to throw a descriptive [[AMBIGUOUS_REFERENCE]] error later or return
+ * [[None]] to continue the name resolution process using other sources.
+ *
+ * This algorithm is incomplete and fully covers only the SQL scenarios. DataFrame
+ * programs can prioritize several layers of [[Project]] outputs if several nested
+ * `.select(...)` calls have conflicting attributes.
*/
private def tryResolveMultipartNameByOutput(
multipartName: Seq[String],
nameComparator: NameComparator,
canResolveNameByHiddenOutput: Boolean,
- shouldPreferTableColumnsOverAliases: Boolean,
shouldPreferHiddenOutput: Boolean,
canReferenceAggregatedAccessOnlyAttributes: Boolean): Option[ResolvedMultipartName] = {
- val (candidates, nestedFields) =
- attributesForResolution.getCandidatesForResolution(multipartName, nameComparator)
-
- val hiddenOutputCandidates = candidates.filter { element =>
- !outputById.containsKey(element.exprId) &&
- (canReferenceAggregatedAccessOnlyAttributes || !element.aggregatedAccessOnly)
- }
+ val (candidates, nestedFields) = getCandidatesForResolution(multipartName)
- val (currentCandidates: Seq[Attribute], resolutionType: String) =
- if (shouldPreferHiddenOutput && hiddenOutputCandidates.nonEmpty) {
- (hiddenOutputCandidates, "hidden")
- } else {
- val outputCandidates = candidates.filter { element =>
- outputById.containsKey(element.exprId)
- }
+ val mainOutputCandidates = getMainOutputCandidates(candidates)
+ val metadataOutputCandidates = getMetadataOutputCandidates(candidates)
- if (outputCandidates.nonEmpty) {
- (outputCandidates, "normal")
- } else {
- val metadataOutputCandidates =
- candidates.filter { element =>
- !outputById.containsKey(element.exprId) && element.qualifiedAccessOnly
- }
+ val resolutionOrder = if (canResolveNameByHiddenOutput) {
+ val hiddenOutputCandidates =
+ getHiddenOutputCandidates(candidates, canReferenceAggregatedAccessOnlyAttributes)
- if (metadataOutputCandidates.nonEmpty) {
- (metadataOutputCandidates, "metadata")
- } else {
- if (canResolveNameByHiddenOutput &&
- !shouldPreferHiddenOutput &&
- hiddenOutputCandidates.nonEmpty) {
- (hiddenOutputCandidates, "hidden")
- } else {
- (Seq.empty, "")
- }
- }
- }
+ if (shouldPreferHiddenOutput) {
+ Seq(
+ CandidatesForResolution(hiddenOutputCandidates, OutputType.Hidden),
+ CandidatesForResolution(mainOutputCandidates, OutputType.Main),
+ CandidatesForResolution(metadataOutputCandidates, OutputType.Metadata)
+ )
+ } else {
+ Seq(
+ CandidatesForResolution(mainOutputCandidates, OutputType.Main),
+ CandidatesForResolution(metadataOutputCandidates, OutputType.Metadata),
+ CandidatesForResolution(hiddenOutputCandidates, OutputType.Hidden)
+ )
}
+ } else {
+ Seq(
+ CandidatesForResolution(mainOutputCandidates, OutputType.Main),
+ CandidatesForResolution(metadataOutputCandidates, OutputType.Metadata)
+ )
+ }
+
+ val suitableCandidates = pickSuitableCandidates(
+ resolutionOrder = resolutionOrder,
+ fallbackCandidates = CandidatesForResolution(mainOutputCandidates, OutputType.Main)
+ )
val resolvedCandidates = attributesForResolution.resolveCandidates(
multipartName,
nameComparator,
- currentCandidates,
+ suitableCandidates.attributes,
nestedFields
)
if (resolvedCandidates.nonEmpty) {
- val candidatesWithPreferredColumnsOverAliases = if (shouldPreferTableColumnsOverAliases) {
- val (aliasCandidates, nonAliasCandidates) =
- resolvedCandidates.partition(candidate => availableAliases.contains(candidate.exprId))
-
- if (nonAliasCandidates.nonEmpty) {
- nonAliasCandidates
- } else {
- aliasCandidates
- }
- } else {
- resolvedCandidates
- }
-
planLogger.logNameResolutionEvent(
multipartName,
- candidatesWithPreferredColumnsOverAliases,
- s"From $resolutionType output"
+ resolvedCandidates,
+ s"From ${suitableCandidates.outputType} output"
)
Some(
ResolvedMultipartName(
- candidates = candidatesWithPreferredColumnsOverAliases,
+ candidates = resolvedCandidates,
referencedAttribute = None
)
)
@@ -687,6 +690,54 @@ class NameScope(
}
}
+ private def getCandidatesForResolution(
+ multipartName: Seq[String]): (Seq[Attribute], Seq[String]) = {
+ val (candidates, nestedFields) =
+ attributesForResolution.getCandidatesForResolution(multipartName, nameComparator)
+
+ val filteredCandidates = if (nestedFields.nonEmpty) {
+ candidates.filter { attribute =>
+ ExtractValue.isExtractable(attribute, nestedFields, nameComparator)
+ }
+ } else {
+ candidates
+ }
+
+ (filteredCandidates, nestedFields)
+ }
+
+ private def getMainOutputCandidates(candidates: Seq[Attribute]): Seq[Attribute] = {
+ candidates.filter { attribute =>
+ outputById.containsKey(attribute.exprId)
+ }
+ }
+
+ private def getMetadataOutputCandidates(candidates: Seq[Attribute]): Seq[Attribute] = {
+ candidates.filter { element =>
+ !outputById.containsKey(element.exprId) && element.qualifiedAccessOnly
+ }
+ }
+
+ private def getHiddenOutputCandidates(
+ candidates: Seq[Attribute],
+ canReferenceAggregatedAccessOnlyAttributes: Boolean): Seq[Attribute] = {
+ candidates.filter { attribute =>
+ !availableAliases.contains(attribute.exprId) &&
+ (canReferenceAggregatedAccessOnlyAttributes || !attribute.aggregatedAccessOnly)
+ }
+ }
+
+ private def pickSuitableCandidates(
+ resolutionOrder: Seq[CandidatesForResolution],
+ fallbackCandidates: CandidatesForResolution): CandidatesForResolution = {
+ resolutionOrder
+ .collectFirst {
+ case candidates if candidates.attributes.size == 1 =>
+ candidates
+ }
+ .getOrElse(fallbackCandidates)
+ }
+
private def tryResolveMultipartNameAsLiteralFunction(
multipartName: Seq[String]): Option[ResolvedMultipartName] = {
val literalFunction = LiteralFunctionResolution.resolve(multipartName).toSeq
@@ -841,8 +892,8 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
/**
* Completely overwrite the current scope state with operator `output`, `hiddenOutput`,
- * `availableAliases`, `aggregateListAliases` and `hasLcaInAggregate`. If `hiddenOutput`,
- * `availableAliases` or `hasLcaInAggregate` are not provided, preserve the previous values.
+ * `availableAliases`, `aggregateListAliases` and `baseAggregate`. If `hiddenOutput`,
+ * `availableAliases` or `baseAggregate` are not provided, preserve the previous values.
* Additionally, update nullabilities of attributes in hidden output from new output, so that if
* attribute was nullable in either old hidden output or new output, it must stay nullable in new
* hidden output as well.
@@ -869,7 +920,7 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
hiddenOutput: Option[Seq[Attribute]] = None,
availableAliases: Option[HashSet[ExprId]] = None,
aggregateListAliases: Seq[Alias] = Seq.empty,
- hasLcaInAggregate: Boolean = false): Unit = {
+ baseAggregate: Option[Aggregate] = None): Unit = {
val hiddenOutputWithUpdatedNullabilities = updateHiddenOutputProperties(
output.getOrElse(stack.peek().output),
hiddenOutput.getOrElse(stack.peek().hiddenOutput)
@@ -880,15 +931,15 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
hiddenOutput = Some(hiddenOutputWithUpdatedNullabilities),
availableAliases = availableAliases,
aggregateListAliases = aggregateListAliases,
- hasLcaInAggregate = hasLcaInAggregate
+ baseAggregate = baseAggregate
)
stack.push(newScope)
}
/**
- * Overwrites `output`, `groupingAttributeIds` and `aggregateListAliases` of the current
- * [[NameScope]] entry and:
+ * Overwrites `output`, `groupingAttributeIds`, `aggregateListAliases` and `baseAggregate` of the
+ * current [[NameScope]] entry and:
* 1. extends hidden output with the provided output (only attributes that are not in the hidden
* output are added). This is done because resolution of arguments can be done through certain
* operators by hidden output. This use case is specific to Dataframe programs. Example:
@@ -916,7 +967,8 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
def overwriteOutputAndExtendHiddenOutput(
output: Seq[Attribute],
groupingAttributeIds: Option[HashSet[ExprId]] = None,
- aggregateListAliases: Seq[Alias] = Seq.empty): Unit = {
+ aggregateListAliases: Seq[Alias] = Seq.empty,
+ baseAggregate: Option[Aggregate] = None): Unit = {
val prevScope = stack.pop
val hiddenOutputWithUpdatedProperties: Seq[Attribute] = updateHiddenOutputProperties(
@@ -932,7 +984,8 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
val newScope = prevScope.overwrite(
output = Some(output),
hiddenOutput = Some(hiddenOutput),
- aggregateListAliases = aggregateListAliases
+ aggregateListAliases = aggregateListAliases,
+ baseAggregate = baseAggregate
)
stack.push(newScope)
@@ -989,11 +1042,11 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
/**
* After finishing the resolution after [[pushScope]], the caller needs to call [[popScope]] to
- * clear the stack. We propagate `hiddenOutput`, `availableAliases` and `hasLcaInAggregate`
- * upwards because of name resolution by overwriting their current values with the popped ones.
- * This is not done in case [[pushScope]] and [[popScope]] were called in the context of subquery
- * resolution (which is indicated by `isSubqueryRoot` flag), because we don't want to overwrite
- * the existing `hiddenOutput` of the main plan.
+ * clear the stack. We propagate `hiddenOutput` and `availableAliases` upwards because of name
+ * resolution by overwriting their current values with the popped ones. This is not done in case
+ * [[pushScope]] and [[popScope]] were called in the context of subquery resolution (which is
+ * indicated by `isSubqueryRoot` flag), because we don't want to overwrite the existing
+ * `hiddenOutput` of the main plan.
*/
def popScope(): Unit = {
val childScope = stack.pop()
@@ -1002,8 +1055,7 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
stack.push(
currentScope.overwrite(
hiddenOutput = Some(childScope.hiddenOutput),
- availableAliases = Some(childScope.availableAliases),
- hasLcaInAggregate = childScope.hasLcaInAggregate
+ availableAliases = Some(childScope.availableAliases)
)
)
}
@@ -1082,7 +1134,6 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
canLaterallyReferenceColumn = canLaterallyReferenceColumn,
canReferenceAggregateExpressionAliases = canReferenceAggregateExpressionAliases,
canResolveNameByHiddenOutput = canResolveNameByHiddenOutput,
- shouldPreferTableColumnsOverAliases = shouldPreferTableColumnsOverAliases,
shouldPreferHiddenOutput = shouldPreferHiddenOutput,
canReferenceAggregatedAccessOnlyAttributes = canReferenceAggregatedAccessOnlyAttributes
)
@@ -1103,7 +1154,9 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
if (nameTarget.candidates.nonEmpty) {
nameTarget.copy(
isOuterReference = true,
- candidates = nameTarget.candidates.map(wrapCandidateInOuterReference)
+ candidates = nameTarget.candidates.map { candidate =>
+ wrapCandidateInOuterReference(candidate, outer)
+ }
)
} else {
nameTargetFromCurrentScope
@@ -1136,18 +1189,60 @@ class NameScopeStack(planLogger: PlanLogger = new PlanLogger) extends SQLConfHel
/**
* Wrap candidate in [[OuterReference]]. If the root is not an [[Attribute]], but an
* [[ExtractValue]] (struct/map/array field reference) we find the actual [[Attribute]] and wrap
- * it in [[OuterReference]].
+ * it in [[OuterReference]]. If the found [[Attribute]] is aliased in the outer scope, we
+ * replace it with an [[Attribute]] created from the [[Alias]].
*/
- private def wrapCandidateInOuterReference(candidate: Expression): Expression = candidate match {
- case candidate: Attribute =>
- OuterReference(candidate)
- case extractValue: ExtractValue =>
- extractValue.transformUp {
- case attribute: Attribute => OuterReference(attribute)
- case other => other
+ private def wrapCandidateInOuterReference(
+ candidate: Expression,
+ outerScope: NameScope): Expression = {
+ candidate match {
+ case extractValue: ExtractValue =>
+ extractValue.transformUp {
+ case attribute: Attribute =>
+ tryReplaceOuterReferenceAttributeWithAlias(attribute, outerScope)
+ case other => other
+ }
+ case attribute: Attribute =>
+ tryReplaceOuterReferenceAttributeWithAlias(attribute, outerScope)
+ case other => other
+ }
+ }
+
+ /**
+ * Try to replace an [[Attribute]] with an [[Attribute]] created out of the [[Alias]] from the
+ * outer scope. For example:
+ *
+ * {{{ SELECT col1 AS alias FROM VALUES('a') GROUP BY col1 HAVING (SELECT col1 = 'a'); }}}
+ *
+ * Plan should be:
+ *
+ * {{{
+ * Filter cast(scalar-subquery#2 [alias#1] as boolean)
+ * +- Project [(outer(alias#1) = a) AS (outer(col1) = a)#3]
+ * +- OneRowRelation
+ * +- Aggregate [col1#0], [col1#0 AS alias#1]
+ * +- LocalRelation [col1#0]
+ * }}}
+ *
+ * As can be seen, we replace `outer(col1)` with `outer(alias)` but keep the original
+ * [[Attribute]] in the name (to be compatible with the fixed-point implementation).
+ */
+ private def tryReplaceOuterReferenceAttributeWithAlias(
+ attribute: Attribute,
+ outerScope: NameScope): OuterReference = {
+ val replacedAttribute = outerScope.aggregateListAliases
+ .collectFirst {
+ case alias if alias.child.semanticEquals(attribute) => alias.toAttribute
}
- case _ =>
- candidate
+ .getOrElse(attribute)
+
+ val outerReference = OuterReference(replacedAttribute)
+ outerReference.setTagValue(
+ OuterReference.SINGLE_PASS_SQL_STRING_OVERRIDE,
+ toPrettySQL(OuterReference(attribute))
+ )
+
+ outerReference
}
/**
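
The `tryReplaceOuterReferenceAttributeWithAlias` logic above reduces to a `collectFirst` over the outer scope's aggregate-list aliases. A standalone sketch of that substitution, with hypothetical names outside the patch:

```scala
import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute, AttributeReference}
import org.apache.spark.sql.types.StringType

// If the attribute is aliased in the outer scope, reference the alias instead.
object ReplaceWithAliasSketch {
  def replace(attribute: Attribute, aggregateListAliases: Seq[Alias]): Attribute =
    aggregateListAliases
      .collectFirst { case alias if alias.child.semanticEquals(attribute) => alias.toAttribute }
      .getOrElse(attribute)

  def main(args: Array[String]): Unit = {
    val col1 = AttributeReference("col1", StringType)()
    val aliased = Alias(col1, "alias")()
    // `col1` is aliased as `alias`, so an outer reference should point at `alias`.
    assert(replace(col1, Seq(aliased)).name == "alias")
  }
}
```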
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/OperatorWithUncomparableTypeValidator.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/OperatorWithUncomparableTypeValidator.scala
new file mode 100644
index 0000000000000..6afa9e379297d
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/OperatorWithUncomparableTypeValidator.scala
@@ -0,0 +1,80 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis.resolver
+
+import org.apache.spark.sql.catalyst.expressions.Attribute
+import org.apache.spark.sql.catalyst.plans.logical.{Distinct, LogicalPlan, SetOperation}
+import org.apache.spark.sql.errors.QueryCompilationErrors
+import org.apache.spark.sql.types.{DataType, MapType, VariantType}
+
+/**
+ * [[OperatorWithUncomparableTypeValidator]] validates a logical plan to ensure
+ * that, if it is a [[Distinct]] or a [[SetOperation]], it does not contain any uncomparable types:
+ * [[VariantType]], [[MapType]], [[GeometryType]] or [[GeographyType]].
+ */
+object OperatorWithUncomparableTypeValidator {
+
+ /**
+ * Validates that the provided logical plan does not contain any uncomparable types:
+ * [[VariantType]], [[MapType]], [[GeometryType]] or [[GeographyType]] (throws a specific
+ * user-facing error if it does). The operators checked are [[Distinct]] and
+ * [[SetOperation]] ([[Union]], [[Except]], [[Intersect]]).
+ */
+ def validate(operator: LogicalPlan, output: Seq[Attribute]): Unit = {
+ operator match {
+ case unsupportedOperator @ (_: SetOperation | _: Distinct) =>
+
+ output.foreach { element =>
+ if (hasMapType(element.dataType)) {
+ throwUnsupportedSetOperationOnMapType(element, unsupportedOperator)
+ }
+
+ if (hasVariantType(element.dataType)) {
+ throwUnsupportedSetOperationOnVariantType(element, unsupportedOperator)
+ }
+ }
+ case _ =>
+ }
+ }
+
+ private def hasMapType(dt: DataType): Boolean = {
+ dt.existsRecursively(_.isInstanceOf[MapType])
+ }
+
+ private def hasVariantType(dt: DataType): Boolean = {
+ dt.existsRecursively(_.isInstanceOf[VariantType])
+ }
+
+ private def throwUnsupportedSetOperationOnMapType(
+ mapCol: Attribute,
+ unresolvedPlan: LogicalPlan): Unit = {
+ throw QueryCompilationErrors.unsupportedSetOperationOnMapType(
+ mapCol = mapCol,
+ origin = unresolvedPlan.origin
+ )
+ }
+
+ private def throwUnsupportedSetOperationOnVariantType(
+ variantCol: Attribute,
+ unresolvedPlan: LogicalPlan): Unit = {
+ throw QueryCompilationErrors.unsupportedSetOperationOnVariantType(
+ variantCol = variantCol,
+ origin = unresolvedPlan.origin
+ )
+ }
+}
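
The validator above relies on Spark-internal `existsRecursively` to detect uncomparable types nested anywhere in the output schema. An equivalent hand-rolled walk for [[MapType]] is sketched below; it is an illustration, not the validator's code.

```scala
import org.apache.spark.sql.types._

// Recursively search a schema for MapType, including maps nested inside
// structs and arrays.
object UncomparableTypeCheckSketch {
  def containsMapType(dt: DataType): Boolean = dt match {
    case _: MapType         => true
    case StructType(fields) => fields.exists(field => containsMapType(field.dataType))
    case ArrayType(elem, _) => containsMapType(elem)
    case _                  => false
  }

  def main(args: Array[String]): Unit = {
    val nested = ArrayType(StructType(Seq(StructField("m", MapType(StringType, IntegerType)))))
    assert(containsMapType(nested))
    assert(!containsMapType(StructType(Seq(StructField("i", IntegerType)))))
  }
}
```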
diff --git a/connect-examples/server-library-example/common/src/main/protobuf/relations.proto b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/OutputType.scala
similarity index 73%
rename from connect-examples/server-library-example/common/src/main/protobuf/relations.proto
rename to sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/OutputType.scala
index 1ebf0e640bef1..04152870e0014 100644
--- a/connect-examples/server-library-example/common/src/main/protobuf/relations.proto
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/OutputType.scala
@@ -15,20 +15,14 @@
* limitations under the License.
*/
-syntax = 'proto3';
+package org.apache.spark.sql.catalyst.analysis.resolver
-option java_multiple_files = true;
-option java_package = "org.apache.connect.examples.serverlibrary.proto";
-
-import "base.proto";
-
-message CustomRelation {
- oneof relation_type {
- Scan scan = 1;
- }
-}
+/**
+ * [[OutputType]] represents different types of output used during multipart name resolution in the
+ * [[NameScope]].
+ */
+object OutputType extends Enumeration {
+ type OutputType = Value
-message Scan {
- // (Required) Table to scan.
- CustomTable table = 1;
+ val Main, Hidden, Metadata = Value
}
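
The enumeration tags candidate groups during multipart name resolution and is logged when a match is found. A tiny self-contained usage sketch; `CandidateGroup` is a hypothetical stand-in for the patch's `CandidatesForResolution`.

```scala
// Tag candidate groups with an output type and pick the first group with
// exactly one match, mirroring the prioritization in pickSuitableCandidates.
object OutputTypeUsageSketch {
  object OutputType extends Enumeration {
    type OutputType = Value
    val Main, Hidden, Metadata = Value
  }

  case class CandidateGroup(names: Seq[String], outputType: OutputType.OutputType)

  def main(args: Array[String]): Unit = {
    val resolutionOrder = Seq(
      CandidateGroup(Seq("col1", "col1"), OutputType.Main), // ambiguous in the main output
      CandidateGroup(Seq("col1"), OutputType.Hidden)        // unique match in the hidden output
    )
    val picked = resolutionOrder.collectFirst { case group if group.names.size == 1 => group }
    println(s"Resolved from ${picked.get.outputType} output") // Resolved from Hidden output
  }
}
```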
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanLogger.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanLogger.scala
index 3c9fb4bea4913..d1cd7adbe994a 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanLogger.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanLogger.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{MESSAGE, QUERY_PLAN}
import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanRewriter.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanRewriter.scala
index 73a83fd8c3eec..544d8180fa1fe 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanRewriter.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PlanRewriter.scala
@@ -59,7 +59,7 @@ class PlanRewriter(
val planWithRewrittenSubqueries =
plan.transformAllExpressionsWithPruning(_.containsPattern(PLAN_EXPRESSION)) {
case subqueryExpression: SubqueryExpression =>
- val rewrittenSubqueryPlan = rewrite(subqueryExpression.plan)
+ val rewrittenSubqueryPlan = doRewriteWithSubqueries(subqueryExpression.plan)
subqueryExpression.withNewPlan(rewrittenSubqueryPlan)
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProducesUnresolvedSubtree.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProducesUnresolvedSubtree.scala
index 576cb98bbabe8..61f5457b42688 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProducesUnresolvedSubtree.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProducesUnresolvedSubtree.scala
@@ -25,8 +25,8 @@ import org.apache.spark.sql.catalyst.expressions.Expression
* called produces partially-unresolved subtrees. In order to resolve the subtree a callback
* resolver is called recursively. This callback must ensure that no node is resolved twice in
* order to not break the single-pass invariant. This is done by tagging the limits of this
- * traversal with [[ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY]] tag. This tag is applied to
- * the original expression's children, which are guaranteed to be resolved at the time of given
+ * traversal with [[ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY]] tag. This tag is applied to the
+ * original expression's children, which are guaranteed to be resolved at the time of given
* expression's resolution. When callback resolver encounters the node that is tagged, it should
* return identity instead of trying to resolve it.
*/
@@ -40,20 +40,20 @@ trait ProducesUnresolvedSubtree extends ResolvesExpressionChildren {
*
* If the result of the callback is the same object as the source `expression`, we don't perform
* the downwards traversal. This is both more optimal and a fail-safe mechanism in case we
- * accidentally lose the [[ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY]] tag.
+ * accidentally lose the [[ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY]] tag.
*/
protected def withResolvedSubtree(
expression: Expression,
expressionResolver: Expression => Expression)(body: => Expression): Expression = {
expression.children.foreach { child =>
- child.setTagValue(ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY, ())
+ child.setTagValue(ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY, ())
}
val resultExpression = body
if (resultExpression.eq(expression)) {
expression.children.foreach { child =>
- child.unsetTagValue(ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY)
+ child.unsetTagValue(ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY)
}
resultExpression
} else {
@@ -68,9 +68,9 @@ trait ProducesUnresolvedSubtree extends ResolvesExpressionChildren {
*/
protected def tryPopSinglePassSubtreeBoundary(unresolvedExpression: Expression): Boolean = {
if (unresolvedExpression
- .getTagValue(ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY)
+ .getTagValue(ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY)
.isDefined) {
- unresolvedExpression.unsetTagValue(ExpressionResolver.SINGLE_PASS_SUBTREE_BOUNDARY)
+ unresolvedExpression.unsetTagValue(ResolverTag.SINGLE_PASS_SUBTREE_BOUNDARY)
true
} else {
false
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProjectResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProjectResolver.scala
index 076ba6019d786..9e6522968b5b4 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProjectResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ProjectResolver.scala
@@ -60,12 +60,19 @@ class ProjectResolver(operatorResolver: Resolver, expressionResolver: Expression
*
* After the subtree and project-list expressions are resolved in the child scope we overwrite
* current scope with resolved operators output to expose new names to the parent operators.
+ *
+ * We need to clear [[NameScope.availableAliases]]. Those are only relevant for the immediate
+ * project list, and clearing them lets output prioritization work correctly in
+ * [[NameScope.tryResolveMultipartNameByOutput]].
*/
override def resolve(unresolvedProject: Project): LogicalPlan = {
scopes.pushScope()
val (resolvedOperator, resolvedProjectList) = try {
val resolvedChild = operatorResolver.resolve(unresolvedProject.child)
+
+ scopes.current.availableAliases.clear()
+
val childReferencedAttributes = expressionResolver.getLastReferencedAttributes
val resolvedProjectList =
expressionResolver.resolveProjectList(unresolvedProject.projectList, unresolvedProject)
@@ -87,7 +94,8 @@ class ProjectResolver(operatorResolver: Resolver, expressionResolver: Expression
expressions = aggregateWithLcaResolutionResult.outputList,
hasAggregateExpressions = false,
hasLateralColumnAlias = false,
- aggregateListAliases = aggregateWithLcaResolutionResult.aggregateListAliases
+ aggregateListAliases = aggregateWithLcaResolutionResult.aggregateListAliases,
+ baseAggregate = Some(aggregateWithLcaResolutionResult.baseAggregate)
)
(aggregateWithLcaResolutionResult.resolvedOperator, projectList)
} else {
@@ -95,8 +103,10 @@ class ProjectResolver(operatorResolver: Resolver, expressionResolver: Expression
// single-pass Analyzer.
ExprUtils.assertValidAggregation(aggregate)
- val resolvedAggregateList =
- resolvedProjectList.copy(aggregateListAliases = scopes.current.aggregateListAliases)
+ val resolvedAggregateList = resolvedProjectList.copy(
+ aggregateListAliases = scopes.current.aggregateListAliases,
+ baseAggregate = Some(aggregate)
+ )
(aggregate, resolvedAggregateList)
}
@@ -119,7 +129,8 @@ class ProjectResolver(operatorResolver: Resolver, expressionResolver: Expression
scopes.overwriteOutputAndExtendHiddenOutput(
output = resolvedProjectList.expressions.map(namedExpression => namedExpression.toAttribute),
- aggregateListAliases = resolvedProjectList.aggregateListAliases
+ aggregateListAliases = resolvedProjectList.aggregateListAliases,
+ baseAggregate = resolvedProjectList.baseAggregate
)
resolvedOperator
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionCheckRunner.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionCheckRunner.scala
new file mode 100644
index 0000000000000..79a3f9cf1707c
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionCheckRunner.scala
@@ -0,0 +1,63 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis.resolver
+
+import org.apache.spark.sql.catalyst.SQLConfHelper
+import org.apache.spark.sql.catalyst.expressions.SubqueryExpression
+import org.apache.spark.sql.catalyst.plans.logical.{AnalysisHelper, LogicalPlan}
+import org.apache.spark.sql.catalyst.trees.TreePattern.PLAN_EXPRESSION
+import org.apache.spark.sql.internal.SQLConf
+
+/**
+ * The [[ResolutionCheckRunner]] is used to run `resolutionChecks` on the logical plan.
+ *
+ * Important note: these checks are not always idempotent, and sometimes perform heavy network
+ * operations.
+ */
+class ResolutionCheckRunner(resolutionChecks: Seq[LogicalPlan => Unit]) extends SQLConfHelper {
+
+ /**
+ * Runs the resolution checks on `plan`. Invokes all the checks for every subquery plan, and
+ * eventually for the main query plan.
+ */
+ def runWithSubqueries(plan: LogicalPlan): Unit = {
+ if (conf.getConf(SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_RUN_EXTENDED_RESOLUTION_CHECKS)) {
+ AnalysisHelper.allowInvokingTransformsInAnalyzer {
+ doRunWithSubqueries(plan)
+ }
+ }
+ }
+
+ private def doRunWithSubqueries(plan: LogicalPlan): Unit = {
+ val planWithRewrittenSubqueries =
+ plan.transformAllExpressionsWithPruning(_.containsPattern(PLAN_EXPRESSION)) {
+ case subqueryExpression: SubqueryExpression =>
+ doRunWithSubqueries(subqueryExpression.plan)
+
+ subqueryExpression
+ }
+
+ run(planWithRewrittenSubqueries)
+ }
+
+ private def run(plan: LogicalPlan): Unit = {
+ for (check <- resolutionChecks) {
+ check(plan)
+ }
+ }
+}
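
A resolution check is just a `LogicalPlan => Unit` function that throws when the resolved plan violates an invariant. Below is a hedged sketch with a hypothetical check; it is not one of Spark's actual extendedResolutionChecks.

```scala
import org.apache.spark.sql.catalyst.plans.logical.{LocalRelation, LogicalPlan}

// A hypothetical check: fail if the resolved plan produces no columns.
object ResolutionCheckSketch {
  val failOnEmptyOutput: LogicalPlan => Unit = plan =>
    require(plan.output.nonEmpty, "Resolved plan must produce at least one column")

  def main(args: Array[String]): Unit = {
    val checks: Seq[LogicalPlan => Unit] = Seq(failOnEmptyOutput)
    val plan: LogicalPlan = LocalRelation() // empty output, so the check fails
    checks.foreach { check =>
      try check(plan)
      catch { case e: IllegalArgumentException => println(e.getMessage) }
    }
  }
}
```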
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionValidator.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionValidator.scala
index b621e396a8839..326ee8463a79f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionValidator.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolutionValidator.scala
@@ -101,6 +101,8 @@ class ResolutionValidator {
validateJoin(join)
case repartition: Repartition =>
validateRepartition(repartition)
+ case sample: Sample =>
+ validateSample(sample)
// [[LogicalRelation]], [[HiveTableRelation]] and other specific relations can't be imported
// because of a potential circular dependency, so we match a generic Catalyst
// [[MultiInstanceRelation]] instead.
@@ -269,6 +271,10 @@ class ResolutionValidator {
validate(repartition.child)
}
+ private def validateSample(sample: Sample): Unit = {
+ validate(sample.child)
+ }
+
private def validateJoin(join: Join) = {
attributeScopeStack.pushScope()
try {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvedProjectList.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvedProjectList.scala
index 6c436d4176d22..9bbce99bb1130 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvedProjectList.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvedProjectList.scala
@@ -18,6 +18,7 @@
package org.apache.spark.sql.catalyst.analysis.resolver
import org.apache.spark.sql.catalyst.expressions.{Alias, NamedExpression}
+import org.apache.spark.sql.catalyst.plans.logical.Aggregate
/**
* Structure used to return results of the resolved project list.
@@ -28,9 +29,12 @@ import org.apache.spark.sql.catalyst.expressions.{Alias, NamedExpression}
* - hasLateralColumnAlias: True if the resolved project list contains any lateral column aliases.
* - aggregateListAliases: List of aliases in aggregate list if there are aggregate expressions in
* the [[Project]].
+ * - baseAggregate: Base [[Aggregate]] node constructed by [[LateralColumnAliasResolver]] while
+ * resolving lateral column references in [[Aggregate]].
*/
case class ResolvedProjectList(
expressions: Seq[NamedExpression],
hasAggregateExpressions: Boolean,
hasLateralColumnAlias: Boolean,
- aggregateListAliases: Seq[Alias])
+ aggregateListAliases: Seq[Alias],
+ baseAggregate: Option[Aggregate] = None)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/Resolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/Resolver.scala
index d9d698b1fecac..75d23f29ecfc5 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/Resolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/Resolver.scala
@@ -21,7 +21,6 @@ import java.util.HashSet
import org.apache.spark.SparkException
import org.apache.spark.sql.AnalysisException
-import org.apache.spark.sql.catalyst.EvaluateUnresolvedInlineTable
import org.apache.spark.sql.catalyst.analysis.{
withPosition,
AnalysisErrorAt,
@@ -43,7 +42,7 @@ import org.apache.spark.sql.catalyst.expressions.{
}
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.trees.CurrentOrigin
-import org.apache.spark.sql.catalyst.trees.TreeNodeTag
+import org.apache.spark.sql.catalyst.util.EvaluateUnresolvedInlineTable
import org.apache.spark.sql.connector.catalog.CatalogManager
import org.apache.spark.sql.errors.QueryCompilationErrors
@@ -112,7 +111,6 @@ class Resolver(
private var relationMetadataProvider: RelationMetadataProvider = new MetadataResolver(
catalogManager,
relationResolution,
- functionResolution,
metadataResolverExtensions
)
@@ -173,7 +171,7 @@ class Resolver(
planLogger.logPlanResolutionEvent(planAfterSubstitution, "Main resolution")
- planAfterSubstitution.setTagValue(Resolver.TOP_LEVEL_OPERATOR, ())
+ planAfterSubstitution.setTagValue(ResolverTag.TOP_LEVEL_OPERATOR, ())
resolve(planAfterSubstitution)
}
@@ -257,6 +255,8 @@ class Resolver(
resolveSupervisingCommand(supervisingCommand)
case repartition: Repartition =>
resolveRepartition(repartition)
+ case sample: Sample =>
+ resolveSample(sample)
case _ =>
tryDelegateResolutionToExtension(unresolvedPlan).getOrElse {
handleUnmatchedOperator(unresolvedPlan)
@@ -476,12 +476,18 @@ class Resolver(
/**
* [[Distinct]] operator doesn't require any special resolution.
+ * We validate results of the resolution using the [[OperatorWithUncomparableTypeValidator]]
+ * ([[MapType]], [[VariantType]], [[GeometryType]] and [[GeographyType]] are not supported
+ * under the [[Distinct]] operator).
*
* `hiddenOutput` and `availableAliases` are reset when [[Distinct]] is reached during tree
* traversal.
*/
private def resolveDistinct(unresolvedDistinct: Distinct): LogicalPlan = {
val resolvedDistinct = unresolvedDistinct.copy(child = resolve(unresolvedDistinct.child))
+
+ OperatorWithUncomparableTypeValidator.validate(resolvedDistinct, scopes.current.output)
+
scopes.overwriteCurrent(
hiddenOutput = Some(scopes.current.output),
availableAliases = Some(new HashSet[ExprId])
@@ -660,6 +666,14 @@ class Resolver(
repartition.copy(child = resolve(repartition.child))
}
+ /**
+ * Resolve [[Sample]] operator. Its resolution doesn't require any specific logic (besides
+ * child resolution).
+ */
+ private def resolveSample(sample: Sample): LogicalPlan = {
+ sample.copy(child = resolve(sample.child))
+ }
+
private def createCteRelationRef(name: String, cteRelationDef: CTERelationDef): LogicalPlan = {
SubqueryAlias(
identifier = name,
@@ -771,11 +785,6 @@ class Resolver(
object Resolver {
- /**
- * Marks the operator as the top-most operator in a query or a view.
- */
- val TOP_LEVEL_OPERATOR = TreeNodeTag[Unit]("top_level_operator")
-
/**
* Create a new instance of the [[RelationResolution]].
*/
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverGuard.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverGuard.scala
index 75215524d2144..5b28d5369e387 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverGuard.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverGuard.scala
@@ -19,7 +19,11 @@ package org.apache.spark.sql.catalyst.analysis.resolver
import java.util.Locale
-import org.apache.spark.sql.catalyst.{FunctionIdentifier, SQLConfHelper, SqlScriptingContextManager}
+import org.apache.spark.sql.catalyst.{
+ FunctionIdentifier,
+ SQLConfHelper,
+ SqlScriptingContextManager
+}
import org.apache.spark.sql.catalyst.analysis.{
FunctionRegistry,
GetViewColumnByNameAndOrdinal,
@@ -143,6 +147,8 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
checkRepartition(repartition)
case having: UnresolvedHaving =>
checkHaving(having)
+ case sample: Sample =>
+ checkSample(sample)
case _ =>
false
}
@@ -168,8 +174,6 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
checkUnresolvedCast(unresolvedCast)
case unresolvedUpCast: UpCast =>
checkUnresolvedUpCast(unresolvedUpCast)
- case unresolvedStar: UnresolvedStar =>
- checkUnresolvedStar(unresolvedStar)
case unresolvedAlias: UnresolvedAlias =>
checkUnresolvedAlias(unresolvedAlias)
case unresolvedAttribute: UnresolvedAttribute =>
@@ -194,6 +198,8 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
checkUnresolvedFunction(unresolvedFunction)
case getViewColumnByNameAndOrdinal: GetViewColumnByNameAndOrdinal =>
checkGetViewColumnBynameAndOrdinal(getViewColumnByNameAndOrdinal)
+ case semiStructuredExtract: SemiStructuredExtract =>
+ checkSemiStructuredExtract(semiStructuredExtract)
case expression if isGenerallySupportedExpression(expression) =>
expression.children.forall(checkExpression)
case _ =>
@@ -219,13 +225,23 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
}
private def checkProject(project: Project) = {
- checkOperator(project.child) && project.projectList.forall(checkExpression)
+ checkOperator(project.child) && project.projectList.forall {
+ case _: UnresolvedStar =>
+ true
+ case other =>
+ checkExpression(other)
+ }
}
private def checkAggregate(aggregate: Aggregate) = {
checkOperator(aggregate.child) &&
aggregate.groupingExpressions.forall(checkExpression) &&
- aggregate.aggregateExpressions.forall(checkExpression)
+ aggregate.aggregateExpressions.forall {
+ case _: UnresolvedStar =>
+ true
+ case other =>
+ checkExpression(other)
+ }
}
private def checkJoin(join: Join) = {
@@ -267,7 +283,8 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
private def checkUnresolvedInlineTable(unresolvedInlineTable: UnresolvedInlineTable) =
unresolvedInlineTable.rows.forall(_.forall(checkExpression))
- private def checkUnresolvedRelation(unresolvedRelation: UnresolvedRelation) = true
+ private def checkUnresolvedRelation(unresolvedRelation: UnresolvedRelation) =
+ !unresolvedRelation.isStreaming
private def checkResolvedInlineTable(resolvedInlineTable: ResolvedInlineTable) =
resolvedInlineTable.rows.forall(_.forall(checkExpression))
@@ -306,8 +323,6 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
private def checkUnresolvedUpCast(upCast: UpCast) = checkExpression(upCast.child)
- private def checkUnresolvedStar(unresolvedStar: UnresolvedStar) = true
-
private def checkUnresolvedAlias(unresolvedAlias: UnresolvedAlias) =
checkExpression(unresolvedAlias.child)
@@ -331,6 +346,7 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
}
private def checkUnresolvedFunction(unresolvedFunction: UnresolvedFunction) =
+ unresolvedFunction.nameParts.size == 1 &&
!ResolverGuard.UNSUPPORTED_FUNCTION_NAMES.contains(unresolvedFunction.nameParts.head) &&
// UDFs are not supported
FunctionRegistry.functionSet.contains(
@@ -358,6 +374,9 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
private def checkGetViewColumnBynameAndOrdinal(
getViewColumnByNameAndOrdinal: GetViewColumnByNameAndOrdinal) = true
+ private def checkSemiStructuredExtract(semiStructuredExtract: SemiStructuredExtract) =
+ checkExpression(semiStructuredExtract.child)
+
private def checkRepartition(repartition: Repartition) = {
checkOperator(repartition.child)
}
@@ -365,6 +384,10 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
private def checkHaving(having: UnresolvedHaving) =
checkExpression(having.havingCondition) && checkOperator(having.child)
+ private def checkSample(sample: Sample) = {
+ checkOperator(sample.child)
+ }
+
/**
* Most of the expressions come from resolving the [[UnresolvedFunction]], but here we have some
* popular expressions allowlist for two reasons:
@@ -417,8 +440,8 @@ class ResolverGuard(catalogManager: CatalogManager) extends SQLConfHelper {
_: RegExpCount | _: RegExpSubStr | _: RegExpInStr =>
true
// JSON
- case _: JsonToStructs | _: StructsToJson | _: SchemaOfJson | _: JsonObjectKeys |
- _: LengthOfJsonArray =>
+ case _: GetJsonObject | _: JsonTuple | _: JsonToStructs | _: StructsToJson |
+ _: SchemaOfJson | _: JsonObjectKeys | _: LengthOfJsonArray =>
true
// CSV
case _: SchemaOfCsv | _: StructsToCsv | _: CsvToStructs =>
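
As a hedged illustration of the allowlist pattern the guard changes above follow, here is a minimal, self-contained Scala sketch: an expression is accepted only if every node is either trivially supported or a function whose name appears in a hard-coded allowlist, and anything else makes the caller fall back to the fixed-point analyzer. The `Expr` hierarchy and function names below are illustrative stand-ins, not Spark's classes.

{{{
sealed trait Expr { def children: Seq[Expr] }
case object Star extends Expr { def children: Seq[Expr] = Nil }
case class Column(name: String) extends Expr { def children: Seq[Expr] = Nil }
case class Func(name: String, children: Seq[Expr]) extends Expr

object GuardSketch {
  // Functions this toy "single-pass" guard claims to support.
  private val supportedFunctions = Set("sum", "avg", "get_json_object", "json_tuple")

  def checkExpression(expr: Expr): Boolean = expr match {
    case Star             => true // stars are expanded later, always allowed
    case Column(_)        => true
    case Func(name, kids) => supportedFunctions.contains(name) && kids.forall(checkExpression)
  }

  def main(args: Array[String]): Unit = {
    println(checkExpression(Func("sum", Seq(Column("col1")))))    // true
    println(checkExpression(Func("my_udf", Seq(Column("col1"))))) // false: fall back to fixed-point
  }
}
}}}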
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverMetricTracker.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverMetricTracker.scala
index 680360836eb7d..0e92684dc2a45 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverMetricTracker.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverMetricTracker.scala
@@ -24,7 +24,6 @@ import org.apache.spark.sql.catalyst.rules.QueryExecutionMetering
* Trait for tracking and logging timing metrics for single-pass resolver.
*/
trait ResolverMetricTracker {
- private val profilerGroup: String = getClass.getSimpleName
/**
* Log top-level timing metrics for single-pass analyzer. In order to utilize existing logging
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverRunner.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverRunner.scala
index 37d41919f1323..fa06d39f13ccb 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverRunner.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverRunner.scala
@@ -18,7 +18,11 @@
package org.apache.spark.sql.catalyst.analysis.resolver
import org.apache.spark.sql.catalyst.{QueryPlanningTracker, SQLConfHelper}
-import org.apache.spark.sql.catalyst.analysis.{AnalysisContext, CleanupAliases}
+import org.apache.spark.sql.catalyst.analysis.{
+ AnalysisContext,
+ CleanupAliases,
+ PullOutNondeterministic
+}
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.internal.SQLConf
@@ -41,7 +45,8 @@ class ResolverRunner(
*/
private val planRewriteRules: Seq[Rule[LogicalPlan]] = Seq(
PruneMetadataColumns,
- CleanupAliases
+ CleanupAliases,
+ PullOutNondeterministic
)
/**
@@ -50,6 +55,11 @@ class ResolverRunner(
*/
private val planRewriter = new PlanRewriter(planRewriteRules, extendedRewriteRules)
+ /**
+ * `resolutionCheckRunner` is used to run `extendedResolutionChecks` on the resolved plan.
+ */
+ private val resolutionCheckRunner = new ResolutionCheckRunner(extendedResolutionChecks)
+
/**
* Entry point for the resolver. This method performs following 4 steps:
* - Resolves the plan in a bottom-up using [[Resolver]], single-pass manner.
@@ -69,7 +79,7 @@ class ResolverRunner(
runValidator(rewrittenPlan)
- runExtendedResolutionChecks(rewrittenPlan)
+ resolutionCheckRunner.runWithSubqueries(rewrittenPlan)
rewrittenPlan
}
@@ -82,12 +92,4 @@ class ResolverRunner(
validator.validatePlan(plan)
}
}
-
- private def runExtendedResolutionChecks(plan: LogicalPlan): Unit = {
- if (conf.getConf(SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_RUN_EXTENDED_RESOLUTION_CHECKS)) {
- for (check <- extendedResolutionChecks) {
- check(plan)
- }
- }
- }
}
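
For readers unfamiliar with the runner shape, a minimal sketch of the "apply a fixed sequence of rewrite rules, then run resolution checks that may throw but never rewrite" structure, using stand-in types rather than Spark's `Rule[LogicalPlan]` machinery:

{{{
case class Plan(description: String)

object RunnerSketch {
  type Rule  = Plan => Plan
  type Check = Plan => Unit

  // Hypothetical rewrite rules, applied in order after resolution.
  val rewriteRules: Seq[Rule] = Seq(
    p => p.copy(description = p.description + " +cleanupAliases"),
    p => p.copy(description = p.description + " +pullOutNondeterministic")
  )

  // Checks validate the rewritten plan; they may throw, but never change it.
  val resolutionChecks: Seq[Check] = Seq(
    p => require(p.description.nonEmpty, "plan must not be empty")
  )

  def run(resolved: Plan): Plan = {
    val rewritten = rewriteRules.foldLeft(resolved)((plan, rule) => rule(plan))
    resolutionChecks.foreach(check => check(rewritten))
    rewritten
  }

  def main(args: Array[String]): Unit =
    println(run(Plan("Project <- LocalRelation")))
}
}}}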
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PullOutNondeterministicExpressionInExpressionTree.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverTag.scala
similarity index 50%
rename from sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PullOutNondeterministicExpressionInExpressionTree.scala
rename to sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverTag.scala
index 3272c6975075c..6de583e1a1c12 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/PullOutNondeterministicExpressionInExpressionTree.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolverTag.scala
@@ -17,28 +17,34 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import java.util.LinkedHashMap
-
-import org.apache.spark.sql.catalyst.expressions.{Expression, NamedExpression}
+import org.apache.spark.sql.catalyst.trees.TreeNodeTag
/**
- * Pull out nondeterministic expressions in an expression tree and replace them with the
- * corresponding attributes in the `nondeterministicToAttributes` map.
+ * Object used to store single-pass resolver related tags.
*/
-object PullOutNondeterministicExpressionInExpressionTree {
- def apply[ExpressionType <: Expression](
- expression: ExpressionType,
- nondeterministicToAttributes: LinkedHashMap[Expression, NamedExpression]): ExpressionType = {
- expression
- .transform {
- case childExpression =>
- nondeterministicToAttributes.get(childExpression) match {
- case null =>
- childExpression
- case namedExpression =>
- namedExpression.toAttribute
- }
- }
- .asInstanceOf[ExpressionType]
- }
+object ResolverTag {
+
+ /**
+ * Tag used to mark [[Project]] nodes added for expression ID deduplication.
+ */
+ val PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION =
+ TreeNodeTag[Unit]("project_for_expression_id_deduplication")
+
+ /**
+ * Tag used to mark a node after resolving it to avoid traversing into its subtree twice.
+ */
+ val SINGLE_PASS_SUBTREE_BOUNDARY =
+ TreeNodeTag[Unit]("single_pass_subtree_boundary")
+
+ /**
+ * Tag used to determine whether a node is an LCA.
+ */
+ val SINGLE_PASS_IS_LCA =
+ TreeNodeTag[Unit]("single_pass_is_lca")
+
+ /**
+ * Tag used to mark the operator as the top-most operator in a query or a view.
+ */
+ val TOP_LEVEL_OPERATOR =
+ TreeNodeTag[Unit]("top_level_operator")
}
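
A minimal, self-contained sketch of the tagging idea: a typed tag is attached to a node so later phases can check for the marker without re-deriving the information. The `Tag`/`Node` classes below are stand-ins, not Spark's `TreeNodeTag` implementation.

{{{
final case class Tag[T](name: String)

class Node(val name: String) {
  private val tags = scala.collection.mutable.Map.empty[Tag[_], Any]
  def setTag[T](tag: Tag[T], value: T): Unit = tags(tag) = value
  def getTag[T](tag: Tag[T]): Option[T] = tags.get(tag).map(_.asInstanceOf[T])
}

object TagSketch {
  // A marker tag analogous to the ones defined above; carries no payload.
  val TopLevelOperator: Tag[Unit] = Tag[Unit]("top_level_operator")

  def main(args: Array[String]): Unit = {
    val project = new Node("Project")
    project.setTag(TopLevelOperator, ())
    println(project.getTag(TopLevelOperator).isDefined) // true: marked as top-level
  }
}
}}}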
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvesNameByHiddenOutput.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvesNameByHiddenOutput.scala
index 06a93910f2c59..ca6f4a63c88ef 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvesNameByHiddenOutput.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ResolvesNameByHiddenOutput.scala
@@ -21,22 +21,11 @@ import java.util.HashSet
import scala.collection.mutable
-import org.apache.spark.sql.catalyst.expressions.{
- Attribute,
- AttributeReference,
- ExprId,
- NamedExpression,
- PipeOperator
-}
-import org.apache.spark.sql.catalyst.plans.logical.{
- Aggregate,
- Distinct,
- LogicalPlan,
- Project,
- SubqueryAlias,
- UnaryNode
-}
+import org.apache.spark.sql.catalyst.SQLConfHelper
+import org.apache.spark.sql.catalyst.expressions.{ExprId, NamedExpression, PipeOperator}
+import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.util._
+import org.apache.spark.sql.internal.SQLConf
/**
* [[ResolvesNameByHiddenOutput]] is used by resolvers for operators that are able to resolve
@@ -175,7 +164,7 @@ import org.apache.spark.sql.catalyst.util._
*
* In the plan you can see that `col2` is added to the lower [[Project.projectList]].
*/
-trait ResolvesNameByHiddenOutput {
+trait ResolvesNameByHiddenOutput extends SQLConfHelper {
/**
* Insert the missing expressions in the output list of the operator. Recursively call
@@ -233,6 +222,20 @@ trait ResolvesNameByHiddenOutput {
case other => other
}
+ /**
+ * Deduplicates missing expressions by [[ExprId]].
+ */
+ def deduplicateMissingExpressions(
+ missingExpressions: Seq[NamedExpression]): Seq[NamedExpression] = {
+ val duplicateMissingExpressions = new HashSet[ExprId]
+ missingExpressions.collect {
+ case expression: NamedExpression
+ if !duplicateMissingExpressions.contains(expression.exprId) =>
+ duplicateMissingExpressions.add(expression.exprId)
+ expression
+ }
+ }
+
private def expandOperatorsOutputList(
operator: UnaryNode,
operatorOutput: Seq[NamedExpression],
@@ -242,24 +245,27 @@ trait ResolvesNameByHiddenOutput {
missingExpressions = missingExpressions
)
- val missingAttributes = filteredMissingExpressions.collect {
- case attribute: AttributeReference => attribute
- }
-
- val expandedChild = insertMissingExpressions(operator.child, missingAttributes)
+ if (filteredMissingExpressions.nonEmpty) {
+ val (metadataCols, nonMetadataCols) =
+ operatorOutput.partition(_.toAttribute.qualifiedAccessOnly)
- val (metadataCols, nonMetadataCols) =
- operatorOutput.partition(_.toAttribute.qualifiedAccessOnly)
+ operator match {
+ case aggregate: Aggregate =>
+ val newAggregateList = nonMetadataCols ++ filteredMissingExpressions ++ metadataCols
+ aggregate.copy(aggregateExpressions = newAggregateList)
+ case project: Project =>
+ val expandedChild = insertMissingExpressions(
+ operator = operator.child,
+ missingExpressions = filteredMissingExpressions
+ )
+ val newProjectList =
+ nonMetadataCols ++ filteredMissingExpressions.map(_.toAttribute) ++ metadataCols
- val newOutputList = nonMetadataCols ++ filteredMissingExpressions ++ metadataCols
- val newOperator = operator match {
- case aggregate: Aggregate =>
- aggregate.copy(aggregateExpressions = newOutputList, child = expandedChild)
- case project: Project =>
- project.copy(projectList = newOutputList, child = expandedChild)
+ project.copy(projectList = newProjectList, child = expandedChild)
+ }
+ } else {
+ operator
}
-
- newOperator
}
private def filterMissingExpressions(
@@ -300,12 +306,43 @@ trait ResolvesNameByHiddenOutput {
* because they may be needed in upper operators (if not, they will be pruned away in
* [[PruneMetadataColumns]]). Other hidden attributes are thrown away, because we cannot
* reference them from the new [[Project]] (they are not outputted from below).
+ *
+ * If [[SQLConf.SINGLE_PASS_RESOLVER_PREVENT_USING_ALIASES_FROM_NON_DIRECT_CHILDREN]] is set to
+ * true, we need to overwrite the current scope and clear `aggregateListAliases` and
+ * `baseAggregate`. This is needed in order to prevent later replacement of Sort/Having
+ * expressions using semantically equal aliased expressions from non-direct children. For
+ * example, in the following query:
+ *
+ * {{{ SELECT col1 AS a FROM VALUES(1,2) GROUP BY col1, col2 HAVING col2 > 1 ORDER BY col1; }}}
+ *
+ * With the flag set to false, the analyzed plan will be:
+ *
+ * Sort [a#3 ASC NULLS FIRST], true
+ * +- Project [a#3]
+ * +- Filter (col2#2 > 1)
+ * +- Aggregate [col1#1, col2#2], [col1#1 AS a#3, col2#2, col1#1]
+ * +- LocalRelation [col1#1, col2#2]
+ *
+ * Instead of using missing attribute `col1#1` we can use its alias `a#3` in the [[Sort]] and
+ * avoid adding an extra projection. This is because all of [[Sort]], [[Project]], [[Filter]] and
+ * [[Aggregate]] belong to the same [[NameScope]] since [[Project]] was artificially inserted.
+ *
+ * However, fixed-point can't handle this case properly and produces the following plan:
+ *
+ * Project [a#3]
+ * +- Sort [col1#1 ASC NULLS FIRST], true
+ * +- Project [a#3, col1#1]
+ * +- Filter (col2#2 > 1)
+ * +- Aggregate [col1#1, col2#2], [col1#1 AS a#3, col2#2, col1#1]
+ * +- LocalRelation [col1#1, col2#2]
+ *
+ * Therefore, we need to match this behavior of fixed-point in single-pass in order to avoid
+ * logical plan mismatches.
*/
def retainOriginalOutput(
operator: LogicalPlan,
missingExpressions: Seq[NamedExpression],
- output: Seq[Attribute],
- hiddenOutput: Seq[Attribute]): LogicalPlan = {
+ scopes: NameScopeStack): LogicalPlan = {
if (missingExpressions.isEmpty) {
operator
} else {
@@ -314,17 +351,29 @@ trait ResolvesNameByHiddenOutput {
missingExpressionIds.add(expression.exprId)
}
- val hiddenOutputToPreserve = hiddenOutput.filter { hiddenAttribute =>
+ val hiddenOutputToPreserve = scopes.current.hiddenOutput.filter { hiddenAttribute =>
hiddenAttribute.qualifiedAccessOnly && missingExpressionIds.contains(
hiddenAttribute.exprId
)
}
val project = Project(
- projectList = output ++ hiddenOutputToPreserve,
+ projectList = scopes.current.output ++ hiddenOutputToPreserve,
child = operator
)
+ if (conf.getConf(
+ SQLConf.ANALYZER_SINGLE_PASS_RESOLVER_PREVENT_USING_ALIASES_FROM_NON_DIRECT_CHILDREN
+ )) {
+ scopes.overwriteCurrent(
+ output = Some(scopes.current.output),
+ hiddenOutput = Some(scopes.current.hiddenOutput),
+ availableAliases = Some(scopes.current.availableAliases),
+ aggregateListAliases = Seq.empty,
+ baseAggregate = None
+ )
+ }
+
project
}
}
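
A minimal sketch of the ExprId-based deduplication performed by `deduplicateMissingExpressions` above, with a stand-in `NamedExpr` type instead of Spark's `NamedExpression`:

{{{
import java.util.HashSet

case class NamedExpr(name: String, exprId: Long)

object DedupSketch {
  // Keep only the first occurrence of each expression ID, preserving order.
  def deduplicateByExprId(missing: Seq[NamedExpr]): Seq[NamedExpr] = {
    val seen = new HashSet[Long]
    missing.collect {
      case e if !seen.contains(e.exprId) =>
        seen.add(e.exprId)
        e
    }
  }

  def main(args: Array[String]): Unit = {
    val missing = Seq(NamedExpr("col1", 1L), NamedExpr("col1", 1L), NamedExpr("col2", 2L))
    println(deduplicateByExprId(missing)) // List(NamedExpr(col1,1), NamedExpr(col2,2))
  }
}
}}}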
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/RewritesAliasesInTopLcaProject.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/RewritesAliasesInTopLcaProject.scala
new file mode 100644
index 0000000000000..1fc9d579f6324
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/RewritesAliasesInTopLcaProject.scala
@@ -0,0 +1,256 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis.resolver
+
+import java.util.{HashMap, HashSet}
+
+import org.apache.spark.sql.catalyst.expressions.{
+ Alias,
+ AttributeReference,
+ Expression,
+ ExprId,
+ NamedExpression
+}
+import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Project}
+import org.apache.spark.sql.catalyst.trees.TreePattern.{AGGREGATE_EXPRESSION, ATTRIBUTE_REFERENCE}
+
+/**
+ * During LCA resolution some aliases may be rewritten as new aliases with new [[ExprId]]s. This
+ * trait handles remapping of old aliases to new ones, when these attributes appear in
+ * [[SortOrder]] expressions and Having conditions.
+ */
+trait RewritesAliasesInTopLcaProject {
+
+ /**
+ * When resolving lateral column references in [[Aggregate]] below [[Sort]] or HAVING operators,
+ * fixed-point first resolves [[SortOrder]] expressions and HAVING conditions using
+ * [[TempResolvedColumn]] and only after that resolves lateral column references. For example,
+ * consider the following query:
+ *
+ * {{{ SELECT avg(col1) AS a, a AS b FROM VALUES(1,2,3) GROUP BY col2 ORDER BY max(col3) }}}
+ *
+ * Fixed-point plan before resolving [[SortOrder]]:
+ *
+ * Sort [max(tempresolvedcolumn(col3#5, col3, false)) ASC NULLS FIRST], true
+ * +- Aggregate [col2#4], [avg(col1#3) AS a#6, lateralAliasReference(a) AS b#7]
+ * +- LocalRelation [col1#3, col2#4, col3#5]
+ *
+ * After resolving [[TempResolvedColumn]]:
+ *
+ * Project [a#6, b#7]
+ * +- Sort [max(col3)#10 ASC NULLS FIRST], true
+ * +- Aggregate [col2#4], [avg(col1#3) AS a#6, lca(a) AS b#7, max(col3#5) AS max(col3)#10]
+ * +- LocalRelation [col1#3, col2#4, col3#5]
+ *
+ * In the above case fixed-point first resolves [[SortOrder]] to `max(col3)#10` and only then
+ * resolves LCAs. However, while resolving LCAs in [[Aggregate]], fixed-point first constructs
+ * a base [[Aggregate]] by pushing down all aggregate expressions with new aliases. It then
+ * places a [[Project]] on top reinstating the original alias on top of a newly created one,
+ * in order to still match the attribute reference from [[SortOrder]]:
+ *
+ * Project [a#6, b#7]
+ * +- Sort [max(col3)#10 ASC NULLS FIRST], true
+ * +- Project [avg(col1)#11 AS a#6, lca(a) AS b#7, max(col3)#12 AS max(col3)#10]
+ * +- Aggregate [col2#4], [avg(col1#3) AS avg(col1)#11, max(col3#5) AS max(col3)#12]
+ * +- LocalRelation [col1#3, col2#4, col3#5]
+ *
+ * In the example above, `max(col3#5)` gets pushed down and aliased as `max(col3)#12`, even
+ * though `max(col3)#10` attribute reference already exists. Because of that `max(col3)#12` needs
+ * to be remapped back to `max(col3)#10`.
+ *
+ * However, in the single-pass analyzer, we first resolve all lateral column references before
+ * starting the resolution of [[SortOrder]], resulting in the following plan:

+ *
+ * Project [a#6, b#7]
+ * +- Sort [max(col3)#16 ASC NULLS FIRST], true
+ * +- Project [a#6, a#6 AS b#7, max(col3)#16]
+ * +- Project [avg(col1)#14, avg(col1)#14 AS a#6, max(col3)#16]
+ * +- Aggregate [col2#4], [avg(col1#3) AS avg(col1)#14, max(col3#5) AS max(col3)#16]
+ * +- LocalRelation [col1#3, col2#4, col3#5]
+ *
+ * In the above case, rewriting `max(col3)#16` with an [[Alias]] is not necessary from a
+ * correctness perspective, but we need to do it in order to stay compatible with the fixed-point
+ * analyzer. Because fixed-point only regenerates aliases from the original aggregate list, in
+ * single-pass we need to handle the following:
+ * 1. all aliases from top-level [[Project]] (because they originate from the unresolved
+ * aggregate list);
+ * 2. all references to aliases from the base aggregate (because they became attribute
+ * references during LCA resolution);
+ *
+ * This same issue also applies to HAVING resolution.
+ */
+ def rewriteNamedExpressionsInTopLcaProject[ExpressionType <: Expression](
+ projectToRewrite: Project,
+ baseAggregate: Aggregate,
+ expressionsToRewrite: Seq[ExpressionType],
+ rewriteCandidates: Seq[NamedExpression],
+ autoGeneratedAliasProvider: AutoGeneratedAliasProvider): (Project, Seq[ExpressionType]) = {
+ val candidateExpressions = getCandidateExpressionsForRewrite(
+ baseAggregate = baseAggregate,
+ oldExpressions = rewriteCandidates,
+ autoGeneratedAliasProvider = autoGeneratedAliasProvider
+ )
+ val newProject = rewriteNamedExpressionsInProject(projectToRewrite, candidateExpressions)
+ val newExpressions = updateAttributeReferencesInExpressions[ExpressionType](
+ expressionsToRewrite,
+ candidateExpressions
+ )
+
+ (newProject, newExpressions)
+ }
+
+ /**
+ * When resolving [[Sort]] or Having on top of an [[Aggregate]] that has lateral column
+ * references, aggregate and grouping expressions might not be correctly replaced in
+ * [[SortOrder]] and HAVING condition, because of [[Project]] nodes created when resolving
+ * lateral column references. Because of that, we need to additionally try and replace
+ * [[SortOrder]] expressions and HAVING conditions that don't appear in the child [[Project]],
+ * but the aliases of semantically equivalent expressions do. In case both the attribute and its
+ * alias exist in the output, don't replace the attribute in [[SortOrder]] / HAVING condition,
+ * because there is no missing input in that case.
+ * For example, consider the following query:
+ *
+ * {{{ SELECT col1 AS a, a FROM VALUES(1) GROUP BY col1 ORDER BY col1 }}}
+ *
+ * After resolving lateral column references and partially resolving [[SortOrder]] expression, we
+ * get the following plan:
+ *
+ * !Sort [col1#3 ASC NULLS FIRST], true
+ * +- Project [a#4, a#4]
+ * +- Project [col1#3, col1#3 AS a#4]
+ * +- Aggregate [col1#3], [col1#3]
+ * +- LocalRelation [col1#3]
+ *
+ * In the above plan, [[Sort]] has a missing input `col1#3`. Because of LCA resolution this
+ * attribute is pushed down into the [[Project]] stack and aliased as `a#4`. Instead of using
+ * `col1#3` we can reference its semantically equivalent alias `a#4` in the [[SortOrder]]. The
+ * resolved plan looks like:
+ *
+ * Sort [a#4 ASC NULLS FIRST], true
+ * +- Project [a#4, a#4]
+ * +- Project [col1#3, col1#3 AS a#4]
+ * +- Aggregate [col1#3], [col1#3]
+ * +- LocalRelation [col1#3]
+ *
+ * Because we used `a#4` alias instead of `col1#3`, we do not need to insert `col1#3` to the
+ * child [[Project]] as a missing expression. Therefore, `missingExpressions` needs to be updated
+ * in order not to insert unnecessary attributes in
+ * [[ResolvesNameByHiddenOutput.insertMissingExpressions]].
+ *
+ * However, for a query like:
+ *
+ * {{{ SELECT col1, col1 AS a FROM VALUES(1) GROUP BY col1 ORDER BY col1 }}}
+ *
+ * The resolved plan will be:
+ *
+ * Sort [col1#4 ASC NULLS FIRST], true
+ * +- Aggregate [col1#4], [col1#4, col1#4 AS a#5]
+ * +- LocalRelation [col1#4]
+ *
+ * In the above example, we do not replace `col1#4` with `a#5` because `col1#4` is present in the
+ * output.
+ */
+ def tryReplaceSortOrderOrHavingConditionWithAlias(
+ sortOrderOrCondition: Expression,
+ scopes: NameScopeStack,
+ missingExpressions: Seq[NamedExpression]): (Expression, Seq[NamedExpression]) = {
+ val replacedAttributeReferences = new HashSet[ExprId]
+ val expressionWithReplacedAliases = sortOrderOrCondition.transformDownWithPruning(
+ _.containsAnyPattern(AGGREGATE_EXPRESSION, ATTRIBUTE_REFERENCE)
+ ) {
+ case attributeReference: AttributeReference =>
+ scopes.current.aggregateListAliases
+ .collectFirst {
+ case alias
+ if alias.child.semanticEquals(attributeReference) &&
+ scopes.current.getAttributeById(attributeReference.exprId).isEmpty =>
+ replacedAttributeReferences.add(attributeReference.exprId)
+ alias.toAttribute
+ }
+ .getOrElse(attributeReference)
+ case aggregateExpression: AggregateExpression =>
+ scopes.current.aggregateListAliases
+ .collectFirst {
+ case alias if alias.child.semanticEquals(aggregateExpression) =>
+ alias.toAttribute
+ }
+ .getOrElse(aggregateExpression)
+ }
+ val filteredMissingExpressions = missingExpressions.filter(
+ expression => !replacedAttributeReferences.contains(expression.exprId)
+ )
+
+ (expressionWithReplacedAliases, filteredMissingExpressions)
+ }
+
+ private def getCandidateExpressionsForRewrite(
+ baseAggregate: Aggregate,
+ oldExpressions: Seq[NamedExpression],
+ autoGeneratedAliasProvider: AutoGeneratedAliasProvider): HashMap[ExprId, NamedExpression] = {
+ val expressionsToRewrite = new HashMap[ExprId, NamedExpression](oldExpressions.size)
+ val baseAggregateOutputLookup = new HashSet[ExprId](baseAggregate.aggregateExpressions.size)
+ baseAggregate.aggregateExpressions.foreach {
+ case alias: Alias => baseAggregateOutputLookup.add(alias.exprId)
+ case _ =>
+ }
+ oldExpressions.foreach {
+ case oldAlias: Alias =>
+ expressionsToRewrite.put(
+ oldAlias.exprId,
+ autoGeneratedAliasProvider.newAlias(oldAlias.toAttribute)
+ )
+ case oldAttributeReference: AttributeReference
+ if baseAggregateOutputLookup.contains(oldAttributeReference.exprId) =>
+ expressionsToRewrite.put(
+ oldAttributeReference.exprId,
+ autoGeneratedAliasProvider.newAlias(oldAttributeReference.toAttribute)
+ )
+ case other => expressionsToRewrite.put(other.exprId, other)
+ }
+
+ expressionsToRewrite
+ }
+
+ private def rewriteNamedExpressionsInProject(
+ project: Project,
+ candidateExpressions: HashMap[ExprId, NamedExpression]): Project = {
+ val newProjectList = project.projectList.map {
+ case namedExpression: NamedExpression =>
+ candidateExpressions.getOrDefault(namedExpression.exprId, namedExpression)
+ case other => other
+ }
+ project.copy(projectList = newProjectList)
+ }
+
+ private def updateAttributeReferencesInExpressions[ExpressionType <: Expression](
+ expressions: Seq[ExpressionType],
+ candidateAliases: HashMap[ExprId, NamedExpression]
+ ): Seq[ExpressionType] = {
+ expressions.map { expression =>
+ expression
+ .transformDownWithPruning(_.containsPattern(ATTRIBUTE_REFERENCE)) {
+ case attributeReference: AttributeReference =>
+ val newAliasOrOldAttribute =
+ candidateAliases.getOrDefault(attributeReference.exprId, attributeReference)
+ newAliasOrOldAttribute.toAttribute
+ }
+ .asInstanceOf[ExpressionType]
+ }
+ }
+}
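
A self-contained sketch of the ExprId-keyed remapping described above: old expression IDs map to new named expressions, and the project list is rewritten through that map. The tiny expression model and IDs are illustrative, not Spark's.

{{{
import java.util.HashMap

case class Named(name: String, exprId: Long)

object RemapSketch {
  // Replace each entry whose ID has a registered replacement; keep everything else as-is.
  def remap(projectList: Seq[Named], replacements: HashMap[Long, Named]): Seq[Named] =
    projectList.map(e => replacements.getOrDefault(e.exprId, e))

  def main(args: Array[String]): Unit = {
    val replacements = new HashMap[Long, Named]
    replacements.put(16L, Named("max(col3)", 17L)) // re-alias max(col3)#16 as #17

    val projectList = Seq(Named("a", 6L), Named("b", 7L), Named("max(col3)", 16L))
    println(remap(projectList, replacements))
    // List(Named(a,6), Named(b,7), Named(max(col3),17))
  }
}
}}}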
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SemiStructuredExtractResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SemiStructuredExtractResolver.scala
new file mode 100644
index 0000000000000..a5f20ae4abc7a
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SemiStructuredExtractResolver.scala
@@ -0,0 +1,77 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.analysis.resolver
+
+import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.catalyst.expressions.{Expression, Literal, SemiStructuredExtract}
+import org.apache.spark.sql.catalyst.expressions.variant.VariantGet
+import org.apache.spark.sql.types.VariantType
+import org.apache.spark.unsafe.types.UTF8String
+
+/**
+ * Resolver for [[SemiStructuredExtract]]. Resolves [[SemiStructuredExtract]] by resolving its
+ * children, replacing it with the proper semi-structured field extraction method and applying type
+ * coercion to the result.
+ */
+class SemiStructuredExtractResolver(expressionResolver: ExpressionResolver)
+ extends TreeNodeResolver[SemiStructuredExtract, Expression]
+ with ResolvesExpressionChildren
+ with CoercesExpressionTypes {
+
+ private val timezoneAwareExpressionResolver =
+ expressionResolver.getTimezoneAwareExpressionResolver
+
+ /**
+ * Resolves children and replaces [[SemiStructuredExtract]] expressions with the proper
+ * semi-structured field extraction method depending on column type. In case the column is of
+ * [[VariantType]], applies timezone to the result of the previous step.
+ *
+ * Currently only JSON is supported as an extraction method. An important distinction from
+ * other JSON extraction methods is that the extraction fields provided here should be
+ * case-insensitive, unless explicitly stated through quoting.
+ *
+ * After replacing with proper extraction method, apply type coercion to the result.
+ */
+ override def resolve(semiStructuredExtract: SemiStructuredExtract): Expression = {
+ val semiStructuredExtractWithResolvedChildren =
+ withResolvedChildren(semiStructuredExtract, expressionResolver.resolve _)
+ .asInstanceOf[SemiStructuredExtract]
+
+ val semiStructuredExtractWithProperExtractionMethod =
+ semiStructuredExtractWithResolvedChildren.child.dataType match {
+ case _: VariantType =>
+ val extractResult = VariantGet(
+ child = semiStructuredExtractWithResolvedChildren.child,
+ path = Literal(UTF8String.fromString(semiStructuredExtractWithResolvedChildren.field)),
+ targetType = VariantType,
+ failOnError = true
+ )
+ timezoneAwareExpressionResolver.resolve(extractResult)
+ case _ =>
+ throw new AnalysisException(
+ errorClass = "COLUMN_IS_NOT_VARIANT_TYPE",
+ messageParameters = Map.empty
+ )
+ }
+
+ coerceExpressionTypes(
+ expression = semiStructuredExtractWithProperExtractionMethod,
+ expressionTreeTraversal = expressionResolver.getExpressionTreeTraversals.current
+ )
+ }
+}
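
A hedged sketch of the dispatch performed by the resolver above: the extraction method is chosen from the child's data type, and anything other than a variant-like type raises the analysis error. The types and strings below are illustrative stand-ins, not Spark's.

{{{
sealed trait DataKind
case object VariantKind extends DataKind
case object OtherKind   extends DataKind

object ExtractSketch {
  // Pick an extraction expression based on the child's type; only variant is supported here.
  def resolveExtraction(childType: DataKind, field: String): String = childType match {
    case VariantKind => s"variant_get(child, '$field')" // path-style, case-insensitive field
    case OtherKind   => throw new IllegalArgumentException("COLUMN_IS_NOT_VARIANT_TYPE")
  }

  def main(args: Array[String]): Unit = {
    println(resolveExtraction(VariantKind, "a.b")) // variant_get(child, 'a.b')
    // resolveExtraction(OtherKind, "a.b") would raise the analysis-style error
  }
}
}}}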
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SetOperationLikeResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SetOperationLikeResolver.scala
index 695413eaf8434..35ec8efaf8301 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SetOperationLikeResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SetOperationLikeResolver.scala
@@ -22,17 +22,10 @@ import java.util.HashSet
import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.analysis.{AnsiTypeCoercion, TypeCoercion, TypeCoercionBase}
import org.apache.spark.sql.catalyst.expressions.{Attribute, Cast, ExprId}
-import org.apache.spark.sql.catalyst.plans.logical.{
- Except,
- Intersect,
- LogicalPlan,
- Project,
- SetOperation,
- Union
-}
+import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.errors.QueryCompilationErrors
-import org.apache.spark.sql.types.{DataType, MapType, MetadataBuilder, VariantType}
+import org.apache.spark.sql.types.{DataType, MetadataBuilder}
/**
* The [[SetOperationLikeResolver]] performs [[Union]], [[Intersect]] or [[Except]] operator
@@ -53,16 +46,17 @@ class SetOperationLikeResolver(resolver: Resolver, expressionResolver: Expressio
* - Create a new mapping in [[ExpressionIdAssigner]] for the current operator. We only need the
* left child mapping, because that's the only child whose expression IDs get propagated
* upwards for [[Union]], [[Intersect]] or [[Except]]. This is an optimization.
- * - Perform individual output deduplication to handle the distinct union case described in
- * [[performIndividualOutputExpressionIdDeduplication]] scaladoc.
- * - Validate that child outputs have same length or throw "NUM_COLUMNS_MISMATCH" otherwise.
* - Compute widened data types for child output attributes using
* [[getTypeCoercion.findWiderTypeForTwo]] or throw "INCOMPATIBLE_COLUMN_TYPE" if coercion
* fails.
+ * - Perform individual output deduplication to handle the distinct union case described in
+ * [[performIndividualOutputExpressionIdDeduplication]] scaladoc.
+ * - Validate that child outputs have same length or throw "NUM_COLUMNS_MISMATCH" otherwise.
* - Add [[Project]] with [[Cast]] on children needing attribute data type widening.
* - Assert that coerced outputs don't have conflicting expression IDs.
* - Merge transformed outputs using a separate logic for each operator type.
* - Store merged output in current [[NameScope]].
+ * - Validate that the operator doesn't have unsupported data types in the output.
* - Create a new mapping in [[ExpressionIdAssigner]] using the coerced and validated outputs.
* - Return the resolved operator with new children optionally wrapped in [[WithCTE]]. See
* [[CteScope]] scaladoc for more info.
@@ -74,30 +68,32 @@ class SetOperationLikeResolver(resolver: Resolver, expressionResolver: Expressio
newOutputIds = childScopes.head.getOutputIds
)
- val (deduplicatedChildren, deduplicatedChildOutputs) =
- performIndividualOutputExpressionIdDeduplication(
- resolvedChildren,
- childScopes.map(_.output),
- unresolvedOperator
- )
+ val childOutputs = childScopes.map(_.output)
- val (newChildren, newChildOutputs) =
- if (needToCoerceChildOutputs(deduplicatedChildOutputs, unresolvedOperator)) {
+ val (coercedChildren, coercedChildOutputs) =
+ if (needToCoerceChildOutputs(childOutputs, unresolvedOperator)) {
coerceChildOutputs(
- deduplicatedChildren,
- deduplicatedChildOutputs,
- validateAndDeduceTypes(unresolvedOperator, deduplicatedChildOutputs)
+ resolvedChildren,
+ childOutputs,
+ validateAndDeduceTypes(unresolvedOperator, childOutputs)
)
} else {
- (deduplicatedChildren, deduplicatedChildOutputs)
+ (resolvedChildren, childOutputs)
}
+ val (newChildren, newChildOutputs) =
+ performIndividualOutputExpressionIdDeduplication(
+ coercedChildren,
+ coercedChildOutputs,
+ unresolvedOperator
+ )
+
ExpressionIdAssigner.assertOutputsHaveNoConflictingExpressionIds(newChildOutputs)
val output = mergeChildOutputs(unresolvedOperator, newChildOutputs)
scopes.overwriteCurrent(output = Some(output), hiddenOutput = Some(output))
- validateOutputs(unresolvedOperator, output)
+ OperatorWithUncomparableTypeValidator.validate(unresolvedOperator, output)
val resolvedOperator = unresolvedOperator.withNewChildren(newChildren)
@@ -362,24 +358,6 @@ class SetOperationLikeResolver(resolver: Resolver, expressionResolver: Expressio
}
}
- /**
- * Validate outputs of [[SetOperation]].
- * - [[MapType]] and [[VariantType]] are currently not supported for [[SetOperations]] and we need
- * to throw a relevant user-facing error.
- */
- private def validateOutputs(unresolvedPlan: LogicalPlan, output: Seq[Attribute]): Unit = {
- unresolvedPlan match {
- case _: SetOperation =>
- output.find(a => hasMapType(a.dataType)).foreach { mapCol =>
- throwUnsupportedSetOperationOnMapType(mapCol, unresolvedPlan)
- }
- output.find(a => hasVariantType(a.dataType)).foreach { variantCol =>
- throwUnsupportedSetOperationOnVariantType(variantCol, unresolvedPlan)
- }
- case _ =>
- }
- }
-
private def getTypeCoercion: TypeCoercionBase = {
if (conf.ansiEnabled) {
AnsiTypeCoercion
@@ -388,24 +366,6 @@ class SetOperationLikeResolver(resolver: Resolver, expressionResolver: Expressio
}
}
- private def throwUnsupportedSetOperationOnMapType(
- mapCol: Attribute,
- unresolvedPlan: LogicalPlan): Unit = {
- throw QueryCompilationErrors.unsupportedSetOperationOnMapType(
- mapCol = mapCol,
- origin = unresolvedPlan.origin
- )
- }
-
- private def throwUnsupportedSetOperationOnVariantType(
- variantCol: Attribute,
- unresolvedPlan: LogicalPlan): Unit = {
- throw QueryCompilationErrors.unsupportedSetOperationOnVariantType(
- variantCol = variantCol,
- origin = unresolvedPlan.origin
- )
- }
-
private def throwNumColumnsMismatch(
expectedNumColumns: Int,
childColumnTypes: Seq[DataType],
@@ -436,12 +396,4 @@ class SetOperationLikeResolver(resolver: Resolver, expressionResolver: Expressio
origin = unresolvedOperator.origin
)
}
-
- private def hasMapType(dt: DataType): Boolean = {
- dt.existsRecursively(_.isInstanceOf[MapType])
- }
-
- private def hasVariantType(dt: DataType): Boolean = {
- dt.existsRecursively(_.isInstanceOf[VariantType])
- }
}
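
A minimal sketch of the "widen each column position across children, fail on count or type mismatch" step from the list above, using a toy type lattice rather than Spark's coercion rules:

{{{
object WidenSketch {
  sealed trait Typ
  case object IntT    extends Typ
  case object LongT   extends Typ
  case object DoubleT extends Typ

  // Toy widening; a real implementation delegates to the configured type-coercion rules.
  def widerOfTwo(a: Typ, b: Typ): Option[Typ] = (a, b) match {
    case (x, y) if x == y              => Some(x)
    case (IntT, LongT) | (LongT, IntT) => Some(LongT)
    case (DoubleT, _) | (_, DoubleT)   => Some(DoubleT)
    case _                             => None
  }

  // Widen position by position across all children; fail if any position cannot be widened.
  def widenOutputs(childOutputs: Seq[Seq[Typ]]): Seq[Typ] =
    childOutputs.reduceLeft { (left, right) =>
      require(left.size == right.size, "NUM_COLUMNS_MISMATCH")
      left.zip(right).map { case (l, r) =>
        widerOfTwo(l, r).getOrElse(sys.error("INCOMPATIBLE_COLUMN_TYPE"))
      }
    }

  def main(args: Array[String]): Unit =
    println(widenOutputs(Seq(Seq(IntT, DoubleT), Seq(LongT, IntT)))) // List(LongT, DoubleT)
}
}}}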
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SortResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SortResolver.scala
index 3e271a324209e..ead425510d57f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SortResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/SortResolver.scala
@@ -17,15 +17,11 @@
package org.apache.spark.sql.catalyst.analysis.resolver
-import java.util.{HashMap, LinkedHashMap}
+import java.util.HashMap
import scala.collection.mutable
-import scala.jdk.CollectionConverters._
-import org.apache.spark.sql.catalyst.analysis.{
- NondeterministicExpressionCollection,
- UnresolvedAttribute
-}
+import org.apache.spark.sql.catalyst.analysis.UnresolvedAttribute
import org.apache.spark.sql.catalyst.expressions.{
Alias,
Attribute,
@@ -34,13 +30,14 @@ import org.apache.spark.sql.catalyst.expressions.{
NamedExpression,
SortOrder
}
-import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, LogicalPlan, Project, Sort}
+import org.apache.spark.sql.catalyst.plans.logical._
/**
* Resolves a [[Sort]] by resolving its child and order expressions.
*/
class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionResolver)
extends TreeNodeResolver[Sort, LogicalPlan]
+ with RewritesAliasesInTopLcaProject
with ResolvesNameByHiddenOutput {
private val scopes: NameScopeStack = operatorResolver.getNameScopes
private val autoGeneratedAliasProvider = new AutoGeneratedAliasProvider(
@@ -102,8 +99,6 @@ class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionRes
* +- Aggregate [col1, (col2 + 1)],
* [col1, sum(col1) AS sum(col1)#..., (col2 + 1) AS (col2 + 1)#...]
* +- LocalRelation [col1, col2]
- * 5. In case there are non-deterministic expressions in the order expressions, substitute them
- * with derived attribute references to an artificial [[Project]] list.
*/
override def resolve(unresolvedSort: Sort): LogicalPlan = {
val resolvedChild = operatorResolver.resolve(unresolvedSort.child)
@@ -123,50 +118,54 @@ class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionRes
} else {
val partiallyResolvedSort = unresolvedSort.copy(child = resolvedChild)
- val (resolvedOrderExpressions, missingAttributes) =
+ val (partiallyResolvedOrderExpressions, missingAttributes) =
resolveOrderExpressions(partiallyResolvedSort)
- val (finalOrderExpressions, missingExpressions) = resolvedChild match {
- case _ if scopes.current.hasLcaInAggregate =>
- throw new ExplicitlyUnsupportedResolverFeature(
- "Lateral column alias in Aggregate below a Sort"
- )
- case aggregate: Aggregate =>
- val (cleanedOrderExpressions, extractedExpressions) =
- extractReferencedGroupingAndAggregateExpressions(aggregate, resolvedOrderExpressions)
- (cleanedOrderExpressions, extractedExpressions)
- case filter @ Filter(_, aggregate: Aggregate) =>
- val (cleanedOrderExpressions, extractedExpressions) =
- extractReferencedGroupingAndAggregateExpressions(aggregate, resolvedOrderExpressions)
- (cleanedOrderExpressions, extractedExpressions)
- case project @ Project(_, Filter(_, aggregate: Aggregate)) =>
- throw new ExplicitlyUnsupportedResolverFeature(
- "Project on top of HAVING below a Sort"
+ val (resolvedOrderExpressions, missingExpressions) = resolvedChild match {
+ case _ @(_: Aggregate | _: Filter | _: Project) if scopes.current.baseAggregate.isDefined =>
+ extractReferencedGroupingAndAggregateExpressions(
+ scopes.current.baseAggregate.get,
+ partiallyResolvedOrderExpressions
)
case other =>
- (resolvedOrderExpressions, missingAttributes)
+ (partiallyResolvedOrderExpressions, missingAttributes)
}
+ val (resolvedOrderExpressionsWithAliasesReplaced, filteredMissingExpressions) =
+ tryReplaceSortOrderWithAlias(resolvedOrderExpressions, missingExpressions)
+
+ val deduplicatedMissingExpressions = deduplicateMissingExpressions(filteredMissingExpressions)
+
val resolvedChildWithMissingAttributes =
- insertMissingExpressions(resolvedChild, missingExpressions)
+ insertMissingExpressions(resolvedChild, deduplicatedMissingExpressions)
+
+ val isChildChangedByMissingExpressions = !resolvedChildWithMissingAttributes.eq(resolvedChild)
+
+ val (finalChild, finalOrderExpressions) = resolvedChildWithMissingAttributes match {
+ case project: Project if scopes.current.baseAggregate.isDefined =>
+ rewriteNamedExpressionsInTopLcaProject[SortOrder](
+ projectToRewrite = project,
+ baseAggregate = scopes.current.baseAggregate.get,
+ expressionsToRewrite = resolvedOrderExpressionsWithAliasesReplaced,
+ rewriteCandidates = missingExpressions,
+ autoGeneratedAliasProvider = autoGeneratedAliasProvider
+ )
+ case other => (other, resolvedOrderExpressionsWithAliasesReplaced)
+ }
val resolvedSort = unresolvedSort.copy(
- child = resolvedChildWithMissingAttributes,
+ child = finalChild,
order = finalOrderExpressions
)
- val sortWithOriginalOutput = retainOriginalOutput(
- operator = resolvedSort,
- missingExpressions = missingExpressions,
- output = scopes.current.output,
- hiddenOutput = scopes.current.hiddenOutput
- )
-
- sortWithOriginalOutput match {
- case project @ Project(_, sort: Sort) =>
- project.copy(child = tryPullOutNondeterministic(sort, childOutput = sort.child.output))
- case sort: Sort =>
- tryPullOutNondeterministic(sort, childOutput = scopes.current.output)
+ if (isChildChangedByMissingExpressions) {
+ retainOriginalOutput(
+ operator = resolvedSort,
+ missingExpressions = missingExpressions,
+ scopes = scopes
+ )
+ } else {
+ resolvedSort
}
}
}
@@ -197,10 +196,6 @@ class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionRes
* SELECT col1 FROM VALUES(1,2) GROUP BY col1 HAVING col1 > 1 ORDER BY col2;
* SELECT col1 FROM VALUES(1) ORDER BY col2;
* }}}
- *
- * If the order expression is not present in the current scope, but an alias of this expression
- * is, replace the order expression with its alias (see
- * [[tryReplaceSortOrderExpressionWithAlias]]).
*/
private def resolveOrderExpressions(
partiallyResolvedSort: Sort): (Seq[SortOrder], Seq[Attribute]) = {
@@ -211,11 +206,9 @@ class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionRes
.resolveExpressionTreeInOperator(sortOrder, partiallyResolvedSort)
.asInstanceOf[SortOrder]
- tryReplaceSortOrderExpressionWithAlias(resolvedSortOrder).getOrElse {
- referencedAttributes.putAll(expressionResolver.getLastReferencedAttributes)
+ referencedAttributes.putAll(expressionResolver.getLastReferencedAttributes)
- resolvedSortOrder
- }
+ resolvedSortOrder
}
val missingAttributes = scopes.current.resolveMissingAttributesByHiddenOutput(
@@ -225,37 +218,6 @@ class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionRes
(resolvedSortOrder, missingAttributes)
}
- /**
- * When resolving [[SortOrder]] on top of an [[Aggregate]], if there is an attribute that is
- * present in `hiddenOutput` and there is an [[Alias]] of this attribute in the `output`,
- * [[SortOrder]] should be resolved by the [[Alias]] instead of an attribute. This is done as
- * optimization in order to avoid a [[Project]] node being added when resolving the attribute via
- * missing input (because attribute is not present in direct output, only its alias is).
- *
- * For example, for a query like:
- *
- * {{{
- * SELECT col1 + 1 AS a FROM VALUES(1) GROUP BY a ORDER BY col1 + 1;
- * }}}
- *
- * The resolved plan should be:
- *
- * Sort [a#2 ASC NULLS FIRST], true
- * +- Aggregate [(col1#1 + 1)], [(col1#1 + 1) AS a#2]
- * +- LocalRelation [col1#1]
- *
- * [[SortOrder]] expression is resolved to alias of `col1 + 1` instead of `col1 + 1` itself.
- */
- private def tryReplaceSortOrderExpressionWithAlias(sortOrder: SortOrder): Option[SortOrder] = {
- scopes.current.aggregateListAliases
- .collectFirst {
- case alias if alias.child.semanticEquals(sortOrder.child) => alias.toAttribute
- }
- .map { aliasCandidate =>
- sortOrder.withNewChildren(newChildren = Seq(aliasCandidate)).asInstanceOf[SortOrder]
- }
- }
-
/**
* Extracts the referenced grouping and aggregate expressions from the order expressions. This is
* used to update the output of the child operator and add a [[Project]] as a parent of [[Sort]]
@@ -313,52 +275,33 @@ class SortResolver(operatorResolver: Resolver, expressionResolver: ExpressionRes
}
/**
- * In case there are non-deterministic expressions in `order` expressions replace them with
- * attributes created out of corresponding non-deterministic expression. Example:
- *
- * {{{ SELECT 1 ORDER BY RAND(); }}}
- *
- * This query would have the following analyzed plan:
- *
- * Project [1]
- * +- Sort [_nondeterministic ASC NULLS FIRST], true
- * +- Project [1, rand(...) AS _nondeterministic#...]
- * +- Project [1 AS 1#...]
- * +- OneRowRelation
- *
- * We use `childOutput` instead of directly calling `scopes.current.output`, because
- * [[insertMissingExpressions]] could have changed the output of the child operator.
- * We could just call `sort.child.output`, but this is suboptimal for the simple case when
- * [[Sort]] child is left unchanged, and in that case we actually call `scopes.current.output`.
- * See the call site in [[resolve]].
+ * When resolving [[Sort]] on top of an [[Aggregate]] that has lateral column aliases,
+ * [[extractReferencedGroupingAndAggregateExpressions]] may not correctly replace all
+ * [[SortOrder]] expressions because of newly constructed [[Project]] nodes coming from LCA
+ * resolution. This method replaces [[SortOrder]] expressions with their aliases if those
+ * expressions don't exist in the child [[Project]] but the aliases do.
+ * For more details see [[tryReplaceSortOrderOrHavingConditionWithAlias]].
*/
- private def tryPullOutNondeterministic(sort: Sort, childOutput: Seq[Attribute]): LogicalPlan = {
- val nondeterministicToAttributes: LinkedHashMap[Expression, NamedExpression] =
- NondeterministicExpressionCollection.getNondeterministicToAttributes(
- sort.order.map(_.child)
- )
+ private def tryReplaceSortOrderWithAlias(
+ orderExpressions: Seq[SortOrder],
+ missingExpressions: Seq[NamedExpression]
+ ): (Seq[SortOrder], Seq[NamedExpression]) = {
+ val replacedOrderExpressions = new mutable.ArrayBuffer[SortOrder]
+ var currentMissingExpressions = missingExpressions
- if (!nondeterministicToAttributes.isEmpty) {
- val newChild = Project(
- childOutput ++ nondeterministicToAttributes.values.asScala.toSeq,
- sort.child
- )
- val resolvedOrder = sort.order.map { sortOrder =>
- sortOrder.copy(
- child = PullOutNondeterministicExpressionInExpressionTree(
- sortOrder.child,
- nondeterministicToAttributes
- )
+ orderExpressions.map { orderExpression =>
+ val (replacedOrder, updatedMissingExpressions) =
+ tryReplaceSortOrderOrHavingConditionWithAlias(
+ sortOrderOrCondition = orderExpression,
+ scopes = scopes,
+ missingExpressions = currentMissingExpressions
)
- }
- val resolvedSort = sort.copy(
- order = resolvedOrder,
- child = newChild
- )
- Project(projectList = childOutput, child = resolvedSort)
- } else {
- sort
+
+ replacedOrderExpressions += replacedOrder.asInstanceOf[SortOrder]
+ currentMissingExpressions = updatedMissingExpressions
}
+
+ (replacedOrderExpressions.toSeq, currentMissingExpressions)
}
private def canOrderByAll(expressions: Seq[SortOrder]): Boolean = {
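
A self-contained sketch of the alias-replacement step described in `tryReplaceSortOrderWithAlias`: if an ORDER BY attribute is not in the output but an alias over a semantically equal expression is, order by the alias and drop the attribute from the missing expressions. All types and IDs below are illustrative.

{{{
case class Attr(name: String, exprId: Long)
case class Aliased(child: Attr, alias: Attr) // alias.child is semantically equal to `child`

object SortAliasSketch {
  def replaceWithAlias(
      orderBy: Attr,
      output: Seq[Attr],
      aggregateListAliases: Seq[Aliased],
      missing: Seq[Attr]): (Attr, Seq[Attr]) = {
    val inOutput = output.exists(_.exprId == orderBy.exprId)
    aggregateListAliases.collectFirst {
      case Aliased(child, alias) if child.exprId == orderBy.exprId && !inOutput => alias
    } match {
      case Some(alias) => (alias, missing.filterNot(_.exprId == orderBy.exprId))
      case None        => (orderBy, missing)
    }
  }

  def main(args: Array[String]): Unit = {
    val col1 = Attr("col1", 3L)
    val a    = Attr("a", 4L)
    // SELECT col1 AS a ... ORDER BY col1: col1 is not in the output, but its alias `a` is.
    println(replaceWithAlias(col1, output = Seq(a), Seq(Aliased(col1, a)), missing = Seq(col1)))
    // (Attr(a,4),List()) -> order by a#4, nothing left to insert as missing input
  }
}
}}}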
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimeAddResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimeAddResolver.scala
deleted file mode 100644
index 561e921d95dd0..0000000000000
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimeAddResolver.scala
+++ /dev/null
@@ -1,71 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.spark.sql.catalyst.analysis.resolver
-
-import org.apache.spark.sql.catalyst.analysis.{
- AnsiStringPromotionTypeCoercion,
- AnsiTypeCoercion,
- StringPromotionTypeCoercion,
- TypeCoercion
-}
-import org.apache.spark.sql.catalyst.expressions.{Expression, TimeAdd}
-
-/**
- * Helper resolver for [[TimeAdd]] which is produced by resolving [[BinaryArithmetic]] nodes.
- */
-class TimeAddResolver(expressionResolver: ExpressionResolver)
- extends TreeNodeResolver[TimeAdd, Expression]
- with ResolvesExpressionChildren
- with CoercesExpressionTypes {
-
- private val traversals = expressionResolver.getExpressionTreeTraversals
-
- protected override val ansiTransformations: CoercesExpressionTypes.Transformations =
- TimeAddResolver.ANSI_TYPE_COERCION_TRANSFORMATIONS
- protected override val nonAnsiTransformations: CoercesExpressionTypes.Transformations =
- TimeAddResolver.TYPE_COERCION_TRANSFORMATIONS
-
- override def resolve(unresolvedTimeAdd: TimeAdd): Expression = {
- val timeAddWithResolvedChildren =
- withResolvedChildren(unresolvedTimeAdd, expressionResolver.resolve _)
- val timeAddWithTypeCoercion: Expression = coerceExpressionTypes(
- expression = timeAddWithResolvedChildren,
- expressionTreeTraversal = traversals.current
- )
- TimezoneAwareExpressionResolver.resolveTimezone(
- timeAddWithTypeCoercion,
- traversals.current.sessionLocalTimeZone
- )
- }
-}
-
-object TimeAddResolver {
- // Ordering in the list of type coercions should be in sync with the list in [[TypeCoercion]].
- private val TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- StringPromotionTypeCoercion.apply,
- TypeCoercion.ImplicitTypeCoercion.apply,
- TypeCoercion.DateTimeOperationsTypeCoercion.apply
- )
-
- // Ordering in the list of type coercions should be in sync with the list in [[AnsiTypeCoercion]].
- private val ANSI_TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- AnsiStringPromotionTypeCoercion.apply,
- AnsiTypeCoercion.ImplicitTypeCoercion.apply,
- AnsiTypeCoercion.AnsiDateTimeOperationsTypeCoercion.apply
- )
-}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimezoneAwareExpressionResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimezoneAwareExpressionResolver.scala
index c084932813c29..712efcef5e7a3 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimezoneAwareExpressionResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/TimezoneAwareExpressionResolver.scala
@@ -123,6 +123,22 @@ object TimezoneAwareExpressionResolver {
/**
* Applies a timezone to a [[TimeZoneAwareExpression]] while preserving original tags.
*
+ * The method is applied recursively to all nested [[TimeZoneAwareExpression]]s which lack a
+ * timezone until we find one which has it. This is because sometimes type coercion rules (or
+ * other code) can produce multiple [[Cast]]s on top of an expression. For example:
+ *
+ * {{{ SELECT NANVL(1, null); }}}
+ *
+ * Plan:
+ *
+ * {{{
+ * Project [nanvl(cast(1 as double), cast(cast(null as int) as double)) AS nanvl(1, NULL)#0]
+ * +- OneRowRelation
+ * }}}
+ *
+ * As can be seen, there are multiple nested [[Cast]] nodes and the timezone should be applied to
+ * all of them.
+ *
* This method is particularly useful for cases like resolving [[Cast]] expressions where tags
* such as [[USER_SPECIFIED_CAST]] need to be preserved.
*
@@ -133,7 +149,13 @@ object TimezoneAwareExpressionResolver {
def resolveTimezone(expression: Expression, timeZoneId: String): Expression = {
expression match {
case timezoneExpression: TimeZoneAwareExpression if timezoneExpression.timeZoneId.isEmpty =>
- val withTimezone = timezoneExpression.withTimeZone(timeZoneId)
+ val childrenWithTimeZone = timezoneExpression.children.map { child =>
+ resolveTimezone(child, timeZoneId)
+ }
+ val withNewChildren = timezoneExpression
+ .withNewChildren(childrenWithTimeZone)
+ .asInstanceOf[TimeZoneAwareExpression]
+ val withTimezone = withNewChildren.withTimeZone(timeZoneId)
withTimezone.copyTagsFrom(timezoneExpression)
withTimezone
case other => other
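
A minimal sketch of the recursive timezone application described above, using a toy Cast/Literal model instead of Spark's expression tree: any timezone-aware node without a timezone gets one, and the walk continues into its children so stacked casts are all covered.

{{{
sealed trait Expr
case class Lit(value: String)                                   extends Expr
case class Cast(child: Expr, timeZoneId: Option[String] = None) extends Expr

object TimezoneSketch {
  def resolveTimezone(expr: Expr, tz: String): Expr = expr match {
    // Timezone-aware node without a timezone: recurse into the child, then set the timezone.
    case c @ Cast(child, None) =>
      c.copy(child = resolveTimezone(child, tz), timeZoneId = Some(tz))
    // Already has a timezone, or is not timezone-aware: stop here.
    case other => other
  }

  def main(args: Array[String]): Unit =
    // cast(cast(null as int) as double): both casts end up with the session timezone.
    println(resolveTimezone(Cast(Cast(Lit("null"))), "UTC"))
}
}}}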
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnaryMinusResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnaryMinusResolver.scala
deleted file mode 100644
index 48ceb7e10ebd5..0000000000000
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnaryMinusResolver.scala
+++ /dev/null
@@ -1,60 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.spark.sql.catalyst.analysis.resolver
-
-import org.apache.spark.sql.catalyst.analysis.{AnsiTypeCoercion, TypeCoercion}
-import org.apache.spark.sql.catalyst.expressions.{Expression, UnaryMinus}
-
-/**
- * Resolver for [[UnaryMinus]]. Resolves children and applies type coercion to target node.
- */
-class UnaryMinusResolver(expressionResolver: ExpressionResolver)
- extends TreeNodeResolver[UnaryMinus, Expression]
- with ResolvesExpressionChildren
- with CoercesExpressionTypes {
-
- private val traversals = expressionResolver.getExpressionTreeTraversals
-
- protected override val ansiTransformations: CoercesExpressionTypes.Transformations =
- UnaryMinusResolver.ANSI_TYPE_COERCION_TRANSFORMATIONS
- protected override val nonAnsiTransformations: CoercesExpressionTypes.Transformations =
- UnaryMinusResolver.TYPE_COERCION_TRANSFORMATIONS
-
- override def resolve(unresolvedUnaryMinus: UnaryMinus): Expression = {
- val unaryMinusWithResolvedChildren =
- withResolvedChildren(unresolvedUnaryMinus, expressionResolver.resolve _)
- coerceExpressionTypes(
- expression = unaryMinusWithResolvedChildren,
- expressionTreeTraversal = traversals.current
- )
- }
-}
-
-object UnaryMinusResolver {
- // Ordering in the list of type coercions should be in sync with the list in [[TypeCoercion]].
- private val TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- TypeCoercion.ImplicitTypeCoercion.apply,
- TypeCoercion.DateTimeOperationsTypeCoercion.apply
- )
-
- // Ordering in the list of type coercions should be in sync with the list in [[AnsiTypeCoercion]].
- private val ANSI_TYPE_COERCION_TRANSFORMATIONS: Seq[Expression => Expression] = Seq(
- AnsiTypeCoercion.ImplicitTypeCoercion.apply,
- AnsiTypeCoercion.AnsiDateTimeOperationsTypeCoercion.apply
- )
-}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnsupportedExpressionInOperatorValidation.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnsupportedExpressionInOperatorValidation.scala
index ae0b5d4a48019..def4e3c30a6c3 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnsupportedExpressionInOperatorValidation.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/UnsupportedExpressionInOperatorValidation.scala
@@ -19,16 +19,7 @@ package org.apache.spark.sql.catalyst.analysis.resolver
import org.apache.spark.sql.catalyst.expressions.{Expression, Generator, WindowExpression}
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
-import org.apache.spark.sql.catalyst.plans.logical.{
- Aggregate,
- BaseEvalPythonUDTF,
- CollectMetrics,
- Generate,
- LateralJoin,
- LogicalPlan,
- Project,
- Window
-}
+import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.errors.QueryCompilationErrors
object UnsupportedExpressionInOperatorValidation {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ViewResolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ViewResolver.scala
index 3470bed9cfb2e..ad1926772e7f1 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ViewResolver.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/ViewResolver.scala
@@ -165,6 +165,7 @@ class ViewResolver(resolver: Resolver, catalogManager: CatalogManager)
*
* @param nestedViewDepth Current nested view depth. Cannot exceed the `maxNestedViewDepth`.
* @param maxNestedViewDepth Maximum allowed nested view depth. Configured in the upper context
+ * based on [[SQLConf.MAX_NESTED_VIEW_DEPTH]].
* @param collation View's default collation if explicitly set.
* @param catalogAndNamespace Catalog and namespace under which the [[View]] was created.
*/
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/package.scala
similarity index 100%
rename from sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver.scala
rename to sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/analysis/resolver/package.scala
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalog.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalog.scala
index 979613ae11266..d1f37020f2111 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalog.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalog.scala
@@ -120,9 +120,21 @@ trait ExternalCatalog {
* @param db Database that table to alter schema for exists in
* @param table Name of table to alter schema for
* @param newDataSchema Updated data schema to be used for the table.
+ * @deprecated since 4.1.0 use `alterTableSchema` instead.
*/
def alterTableDataSchema(db: String, table: String, newDataSchema: StructType): Unit
+ /**
+ * Alter the schema of a table identified by the provided database and table name.
+ *
+ * All partition columns must be preserved.
+ *
+ * @param db Database that table to alter schema for exists in
+ * @param table Name of table to alter schema for
+ * @param newSchema Updated schema to be used for the table.
+ */
+ def alterTableSchema(db: String, table: String, newSchema: StructType): Unit
+
/** Alter the statistics of a table. If `stats` is None, then remove all existing statistics. */
def alterTableStats(db: String, table: String, stats: Option[CatalogStatistics]): Unit
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalogWithListener.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalogWithListener.scala
index c2613ff74da4a..33f088079caa7 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalogWithListener.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/ExternalCatalogWithListener.scala
@@ -125,6 +125,12 @@ class ExternalCatalogWithListener(delegate: ExternalCatalog)
postToAll(AlterTableEvent(db, table, AlterTableKind.DATASCHEMA))
}
+ override def alterTableSchema(db: String, table: String, newSchema: StructType): Unit = {
+ postToAll(AlterTablePreEvent(db, table, AlterTableKind.SCHEMA))
+ delegate.alterTableSchema(db, table, newSchema)
+ postToAll(AlterTableEvent(db, table, AlterTableKind.SCHEMA))
+ }
+
override def alterTableStats(
db: String,
table: String,
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/InMemoryCatalog.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/InMemoryCatalog.scala
index 284ca63d820fe..5d0184579faac 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/InMemoryCatalog.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/InMemoryCatalog.scala
@@ -331,6 +331,21 @@ class InMemoryCatalog(
catalog(db).tables(table).table = origTable.copy(schema = newSchema)
}
+ override def alterTableSchema(
+ db: String,
+ table: String,
+ newSchema: StructType): Unit = synchronized {
+ requireTableExists(db, table)
+ val origTable = catalog(db).tables(table).table
+
+ val partCols = origTable.partitionColumnNames
+ assert(newSchema.map(_.name).takeRight(partCols.length) == partCols,
+ s"Partition columns ${partCols.mkString("[", ", ", "]")} are only supported at the end of " +
+ s"the new schema ${newSchema.catalogString} for now.")
+
+ catalog(db).tables(table).table = origTable.copy(schema = newSchema)
+ }
+
override def alterTableStats(
db: String,
table: String,
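
A standalone sketch (illustrative column names, not part of the patch) of the invariant that the new `InMemoryCatalog.alterTableSchema` asserts above: the partition columns must still appear, in the same order, at the end of the new schema.

```scala
import org.apache.spark.sql.types._

// Mirror of the check asserted in InMemoryCatalog.alterTableSchema.
def partitionColumnsPreserved(newSchema: StructType, partCols: Seq[String]): Boolean =
  newSchema.map(_.name).takeRight(partCols.length) == partCols

val partCols = Seq("dt")
val widened = new StructType()
  .add("id", LongType)
  .add("value", StringType)
  .add("extra", StringType) // newly added data column
  .add("dt", StringType)    // partition column kept at the end
val reordered = new StructType()
  .add("dt", StringType)    // partition column moved to the front
  .add("id", LongType)

assert(partitionColumnsPreserved(widened, partCols))
assert(!partitionColumnsPreserved(reordered, partCols))
```
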
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/SessionCatalog.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/SessionCatalog.scala
index 3eb1b35d24195..e0d1cf011e06a 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/SessionCatalog.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/SessionCatalog.scala
@@ -41,7 +41,7 @@ import org.apache.spark.sql.catalyst.catalog.SQLFunction.parseDefault
import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute, AttributeReference, Cast, Expression, ExpressionInfo, LateralSubquery, NamedArgumentExpression, NamedExpression, OuterReference, ScalarSubquery, UpCast}
import org.apache.spark.sql.catalyst.parser.{CatalystSqlParser, ParserInterface}
import org.apache.spark.sql.catalyst.plans.Inner
-import org.apache.spark.sql.catalyst.plans.logical.{FunctionSignature, InputParameter, LateralJoin, LocalRelation, LogicalPlan, NamedParametersSupport, OneRowRelation, Project, SubqueryAlias, View}
+import org.apache.spark.sql.catalyst.plans.logical.{FunctionSignature, InputParameter, LateralJoin, LogicalPlan, NamedParametersSupport, OneRowRelation, Project, SubqueryAlias, View}
import org.apache.spark.sql.catalyst.trees.CurrentOrigin
import org.apache.spark.sql.catalyst.util.{CharVarcharUtils, StringUtils}
import org.apache.spark.sql.connector.catalog.CatalogManager
@@ -484,6 +484,7 @@ class SessionCatalog(
*
* @param identifier TableIdentifier
* @param newDataSchema Updated data schema to be used for the table
+ * @deprecated since 4.1.0 use `alterTableSchema` instead.
*/
def alterTableDataSchema(
identifier: TableIdentifier,
@@ -507,6 +508,25 @@ class SessionCatalog(
externalCatalog.alterTableDataSchema(db, table, newDataSchema)
}
+ /**
+ * Alter the schema of a table identified by the provided table identifier. All partition columns
+ * must be preserved.
+ *
+ * @param identifier TableIdentifier
+ * @param newSchema Updated schema to be used for the table
+ */
+ def alterTableSchema(
+ identifier: TableIdentifier,
+ newSchema: StructType): Unit = {
+ val qualifiedIdent = qualifyIdentifier(identifier)
+ val db = qualifiedIdent.database.get
+ val table = qualifiedIdent.table
+ requireDbExists(db)
+ requireTableExists(qualifiedIdent)
+
+ externalCatalog.alterTableSchema(db, table, newSchema)
+ }
+
private def columnNameResolved(
resolver: Resolver,
schema: StructType,
@@ -982,7 +1002,13 @@ class SessionCatalog(
objectType = Some("VIEW"),
objectName = Some(metadata.qualifiedName)
)
- val parsedPlan = SQLConf.withExistingConf(View.effectiveSQLConf(viewConfigs, isTempView)) {
+ val parsedPlan = SQLConf.withExistingConf(
+ View.effectiveSQLConf(
+ configs = viewConfigs,
+ isTempView = isTempView,
+ createSparkVersion = metadata.createVersion
+ )
+ ) {
CurrentOrigin.withOrigin(origin) {
parser.parseQuery(viewText)
}
@@ -1010,7 +1036,11 @@ class SessionCatalog(
// Note that, the column names may have duplication, e.g. `CREATE VIEW v(x, y) AS
// SELECT 1 col, 2 col`. We need to make sure that the matching attributes have the same
// number of duplications, and pick the corresponding attribute by ordinal.
- val viewConf = View.effectiveSQLConf(metadata.viewSQLConfigs, isTempView)
+ val viewConf = View.effectiveSQLConf(
+ configs = metadata.viewSQLConfigs,
+ isTempView = isTempView,
+ createSparkVersion = metadata.createVersion
+ )
val normalizeColName: String => String = if (viewConf.caseSensitiveAnalysis) {
identity
} else {
@@ -1459,7 +1489,12 @@ class SessionCatalog(
requireDbExists(db)
val newFuncDefinition = funcDefinition.copy(identifier = qualifiedIdent)
if (!functionExists(qualifiedIdent)) {
- externalCatalog.createFunction(db, newFuncDefinition)
+ try {
+ externalCatalog.createFunction(db, newFuncDefinition)
+ } catch {
+ case e: FunctionAlreadyExistsException if ignoreIfExists =>
+ // Ignore the exception as ignoreIfExists is set to true
+ }
} else if (!ignoreIfExists) {
throw new FunctionAlreadyExistsException(Seq(db, qualifiedIdent.funcName))
}
@@ -1481,6 +1516,8 @@ class SessionCatalog(
// For a permanent function, because we loaded it to the FunctionRegistry
// when it's first used, we also need to drop it from the FunctionRegistry.
functionRegistry.dropFunction(qualifiedIdent)
+ } else if (tableFunctionRegistry.functionExists(qualifiedIdent)) {
+ tableFunctionRegistry.dropFunction(qualifiedIdent)
}
externalCatalog.dropFunction(db, funcName)
} else if (!ignoreIfNotExists) {
@@ -1615,6 +1652,7 @@ class SessionCatalog(
// Use captured SQL configs when parsing a SQL function.
val conf = new SQLConf()
function.getSQLConfigs.foreach { case (k, v) => conf.settings.put(k, v) }
+ Analyzer.trySetAnsiValue(conf)
SQLConf.withExistingConf(conf) {
val inputParam = function.inputParam
val returnType = function.getScalarFuncReturnType
@@ -1646,7 +1684,14 @@ class SessionCatalog(
paddedInput.zip(param.fields).map {
case (expr, param) =>
- Alias(Cast(expr, param.dataType), param.name)(
+ // Add outer references to all resolved attributes and outer references in the function
+ // input. Outer references also need to be wrapped because the function input may
+ // already contain outer references.
+ val outer = expr.transform {
+ case a: Attribute if a.resolved => OuterReference(a)
+ case o: OuterReference => OuterReference(o)
+ }
+ Alias(Cast(outer, param.dataType), param.name)(
qualifier = qualifier,
// mark the alias as function input
explicitMetadata = Some(metaForFuncInputAlias))
@@ -1654,8 +1699,7 @@ class SessionCatalog(
}.getOrElse(Nil)
val body = if (query.isDefined) ScalarSubquery(query.get) else expression.get
- Project(Alias(Cast(body, returnType), funcName)() :: Nil,
- Project(inputs, LocalRelation(inputs.flatMap(_.references))))
+ Project(Alias(Cast(body, returnType), funcName)() :: Nil, Project(inputs, OneRowRelation()))
}
}
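
A hedged usage sketch of the new `SessionCatalog.alterTableSchema` entry point. The database, table, and column names are illustrative, and a configured `SessionCatalog` holding an existing partitioned table is assumed; unlike the deprecated `alterTableDataSchema`, the full schema, including the trailing partition column(s), is passed in.

```scala
import org.apache.spark.sql.catalyst.TableIdentifier
import org.apache.spark.sql.catalyst.catalog.SessionCatalog
import org.apache.spark.sql.types._

// Widen a table `db.tbl` partitioned by `dt` with one extra data column.
def addExtraColumn(catalog: SessionCatalog): Unit = {
  val newSchema = new StructType()
    .add("id", LongType)
    .add("value", StringType)
    .add("extra", StringType) // newly added data column
    .add("dt", StringType)    // partition column stays at the end
  catalog.alterTableSchema(TableIdentifier("tbl", Some("db")), newSchema)
}
```
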
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/UserDefinedFunctionErrors.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/UserDefinedFunctionErrors.scala
index 904a17bc8ce44..ad142704f1047 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/UserDefinedFunctionErrors.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/UserDefinedFunctionErrors.scala
@@ -98,6 +98,12 @@ object UserDefinedFunctionErrors extends QueryErrorsBase {
"tempObjName" -> toSQLId(varName)))
}
+ def cyclicFunctionReference(path: String): Throwable = {
+ new AnalysisException(
+ errorClass = "CYCLIC_FUNCTION_REFERENCE",
+ messageParameters = Map("path" -> path))
+ }
+
def routinePropertyTooLarge(routineName: String): Throwable = {
new AnalysisException(
errorClass = "USER_DEFINED_FUNCTIONS.ROUTINE_PROPERTY_TOO_LARGE",
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/VariableManager.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/VariableManager.scala
index ae313f66c9f3d..4c7d8db6604b6 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/VariableManager.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/VariableManager.scala
@@ -81,6 +81,14 @@ trait VariableManager {
* @return true if at least one variable exists, false otherwise.
*/
def isEmpty: Boolean
+
+ /**
+ * Formats a variable name for use in error messages.
+ * @param variableName Name of the variable
+ * @return The variable name formatted for error messages
+ */
+ def getVariableNameForError(variableName: String): String
+
}
/**
@@ -105,6 +113,9 @@ class TempVariableManager extends VariableManager with DataTypeErrorsBase {
@GuardedBy("this")
private val variables = new mutable.HashMap[String, VariableDefinition]
+ override def getVariableNameForError(variableName: String): String =
+ toSQLId(Seq(SYSTEM_CATALOG_NAME, SESSION_NAMESPACE, variableName))
+
override def create(
nameParts: Seq[String],
varDef: VariableDefinition,
@@ -114,7 +125,7 @@ class TempVariableManager extends VariableManager with DataTypeErrorsBase {
throw new AnalysisException(
errorClass = "VARIABLE_ALREADY_EXISTS",
messageParameters = Map(
- "variableName" -> toSQLId(Seq(SYSTEM_CATALOG_NAME, SESSION_NAMESPACE, name))))
+ "variableName" -> getVariableNameForError(name)))
}
variables.put(name, varDef)
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/events.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/events.scala
index e7d41644392d5..974c225afbae3 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/events.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/events.scala
@@ -126,6 +126,7 @@ case class RenameTableEvent(
object AlterTableKind extends Enumeration {
val TABLE = "table"
val DATASCHEMA = "dataSchema"
+ val SCHEMA = "schema"
val STATS = "stats"
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/interface.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/interface.scala
index d92d2881445ce..badfd0dfafb63 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/interface.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/interface.scala
@@ -22,17 +22,17 @@ import java.time.{ZoneId, ZoneOffset}
import java.util.Date
import scala.collection.mutable
+import scala.util.Try
import scala.util.control.NonFatal
import com.fasterxml.jackson.annotation.JsonInclude.Include
import com.fasterxml.jackson.databind.{DeserializationFeature, ObjectMapper}
import com.fasterxml.jackson.module.scala.{ClassTagExtensions, DefaultScalaModule}
-import org.apache.commons.lang3.StringUtils
import org.json4s.JsonAST.{JArray, JBool, JDecimal, JDouble, JInt, JLong, JNull, JObject, JString, JValue}
import org.json4s.jackson.JsonMethods._
import org.apache.spark.SparkException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.{CurrentUserContext, FunctionIdentifier, InternalRow, SQLConfHelper, TableIdentifier}
@@ -50,6 +50,7 @@ import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types._
import org.apache.spark.sql.util.{CaseInsensitiveStringMap, SchemaUtils}
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.Utils
/**
* Interface providing util to convert JValue to String representation of catalog entities.
@@ -629,10 +630,6 @@ case class CatalogTable(
if (lastAccessTime <= 0) JString("UNKNOWN")
else JLong(lastAccessTime)
- val viewQueryOutputColumns: JValue =
- if (viewQueryColumnNames.nonEmpty) JArray(viewQueryColumnNames.map(JString).toList)
- else JNull
-
val map = mutable.LinkedHashMap[String, JValue]()
if (identifier.catalog.isDefined) map += "Catalog" -> JString(identifier.catalog.get)
@@ -649,21 +646,35 @@ case class CatalogTable(
}
if (comment.isDefined) map += "Comment" -> JString(comment.get)
if (collation.isDefined) map += "Collation" -> JString(collation.get)
- if (tableType == CatalogTableType.VIEW && viewText.isDefined) {
- map += "View Text" -> JString(viewText.get)
- }
- if (tableType == CatalogTableType.VIEW && viewOriginalText.isDefined) {
- map += "View Original Text" -> JString(viewOriginalText.get)
- }
- if (SQLConf.get.viewSchemaBindingEnabled && tableType == CatalogTableType.VIEW) {
- map += "View Schema Mode" -> JString(viewSchemaMode.toString)
- }
- if (viewCatalogAndNamespace.nonEmpty && tableType == CatalogTableType.VIEW) {
- import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
- map += "View Catalog and Namespace" -> JString(viewCatalogAndNamespace.quoted)
- }
- if (viewQueryOutputColumns != JNull) {
- map += "View Query Output Columns" -> viewQueryOutputColumns
+
+ if (tableType == CatalogTableType.VIEW) {
+ if (viewText.isDefined) {
+ map += "View Text" -> JString(viewText.get)
+ }
+ if (viewOriginalText.isDefined) {
+ map += "View Original Text" -> JString(viewOriginalText.get)
+ }
+ if (SQLConf.get.viewSchemaBindingEnabled) {
+ val viewSchemaModeInfo = Try(viewSchemaMode.toString).getOrElse("UNKNOWN")
+ map += "View Schema Mode" -> JString(viewSchemaModeInfo)
+ }
+ val viewCatalogAndNamespaceInfos = Try(viewCatalogAndNamespace).getOrElse(Seq.empty)
+ if (viewCatalogAndNamespaceInfos.nonEmpty) {
+ import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
+ map += "View Catalog and Namespace" -> JString(viewCatalogAndNamespaceInfos.quoted)
+ }
+ val viewQueryOutputColumns: JValue = Try {
+ if (viewSchemaMode == SchemaEvolution) {
+ JArray(schema.map(_.name).map(JString).toList)
+ } else if (viewQueryColumnNames.nonEmpty) {
+ JArray(viewQueryColumnNames.map(JString).toList)
+ } else {
+ JNull
+ }
+ }.getOrElse(JNull)
+ if (viewQueryOutputColumns != JNull) {
+ map += "View Query Output Columns" -> viewQueryOutputColumns
+ }
}
if (tableProperties != JNull) map += "Table Properties" -> tableProperties
stats.foreach { s =>
@@ -1144,7 +1155,7 @@ case class HiveTableRelation(
val metadataEntries = metadata.toSeq.map {
case (key, value) if key == "CatalogTable" => value
case (key, value) =>
- key + ": " + StringUtils.abbreviate(value, SQLConf.get.maxMetadataStringLength)
+ key + ": " + Utils.abbreviate(value, SQLConf.get.maxMetadataStringLength)
}
val metadataStr = truncatedString(metadataEntries, "[", ", ", "]", maxFields)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVExprUtils.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVExprUtils.scala
index 7b6664a4117a2..5f1f0bff6df40 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVExprUtils.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVExprUtils.scala
@@ -17,8 +17,6 @@
package org.apache.spark.sql.catalyst.csv
-import org.apache.commons.lang3.StringUtils
-
import org.apache.spark.SparkIllegalArgumentException
object CSVExprUtils {
@@ -134,7 +132,7 @@ object CSVExprUtils {
// in order to use existing escape logic
val readAhead = if (str(idx) == '\\') 2 else 1
// get the chunk of 1 or 2 input characters to convert to a single delimiter char
- val chunk = StringUtils.substring(str, idx, idx + readAhead)
+ val chunk = str.substring(idx, idx + readAhead)
delimiter += toChar(chunk)
// advance the counter by the length of input chunk processed
idx += chunk.length()
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVHeaderChecker.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVHeaderChecker.scala
index 1c6eecad170f1..bec52747dea7c 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVHeaderChecker.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/csv/CSVHeaderChecker.scala
@@ -21,7 +21,7 @@ import com.univocity.parsers.common.AbstractParser
import com.univocity.parsers.csv.{CsvParser, CsvParserSettings}
import org.apache.spark.SparkIllegalArgumentException
-import org.apache.spark.internal.{Logging, MDC, MessageWithContext}
+import org.apache.spark.internal.{Logging, MessageWithContext}
import org.apache.spark.internal.LogKeys.{CSV_HEADER_COLUMN_NAME, CSV_HEADER_COLUMN_NAMES, CSV_HEADER_LENGTH, CSV_SCHEMA_FIELD_NAME, CSV_SCHEMA_FIELD_NAMES, CSV_SOURCE, NUM_COLUMNS}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.StructType
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/AliasHelper.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/AliasHelper.scala
index 2cd313c873c63..6ea79f7363227 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/AliasHelper.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/AliasHelper.scala
@@ -99,16 +99,12 @@ trait AliasHelper {
val res = CurrentOrigin.withOrigin(e.origin) {
e match {
case a: Alias =>
- val metadata = if (a.metadata == Metadata.empty) {
- None
- } else {
- Some(a.metadata)
- }
+ // Preserve the _effective_ metadata.
a.copy(child = trimAliases(a.child))(
exprId = a.exprId,
qualifier = a.qualifier,
- explicitMetadata = metadata,
- nonInheritableMetadataKeys = a.nonInheritableMetadataKeys)
+ explicitMetadata = Some(a.metadata),
+ nonInheritableMetadataKeys = Nil)
case a: MultiAlias =>
a.copy(child = trimAliases(a.child))
case other => trimAliases(other)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ApproxTopKExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ApproxTopKExpressions.scala
new file mode 100644
index 0000000000000..3c9440764a9a1
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ApproxTopKExpressions.scala
@@ -0,0 +1,143 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.expressions
+
+import org.apache.datasketches.frequencies.ItemsSketch
+import org.apache.datasketches.memory.Memory
+
+import org.apache.spark.sql.catalyst.InternalRow
+import org.apache.spark.sql.catalyst.analysis.FunctionRegistry
+import org.apache.spark.sql.catalyst.analysis.TypeCheckResult
+import org.apache.spark.sql.catalyst.analysis.TypeCheckResult.{TypeCheckFailure, TypeCheckSuccess}
+import org.apache.spark.sql.catalyst.expressions.aggregate.ApproxTopK
+import org.apache.spark.sql.catalyst.expressions.codegen.CodegenFallback
+import org.apache.spark.sql.types._
+
+/**
+ * An expression that estimates the top K items from a sketch.
+ *
+ * The input is a sketch state that is generated by the ApproxTopKAccumulation function.
+ * The output is an array of structs, each containing a frequent item and its estimated frequency.
+ * The items are sorted by their estimated frequency in descending order.
+ *
+ * @param state The sketch state, which is a struct containing the serialized sketch data,
+ * the original data type and the max items tracked of the sketch.
+ * @param k The number of top items to estimate.
+ */
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(state, k) - Returns top k items with their frequency.
+ `k` An optional INTEGER literal greater than 0. If k is not specified, it defaults to 5.
+ """,
+ examples = """
+ Examples:
+ > SELECT _FUNC_(approx_top_k_accumulate(expr)) FROM VALUES (0), (0), (1), (1), (2), (3), (4), (4) AS tab(expr);
+ [{"item":0,"count":2},{"item":4,"count":2},{"item":1,"count":2},{"item":2,"count":1},{"item":3,"count":1}]
+
+ > SELECT _FUNC_(approx_top_k_accumulate(expr), 2) FROM VALUES 'a', 'b', 'c', 'c', 'c', 'c', 'd', 'd' tab(expr);
+ [{"item":"c","count":4},{"item":"d","count":2}]
+ """,
+ group = "misc_funcs",
+ since = "4.1.0")
+// scalastyle:on line.size.limit
+case class ApproxTopKEstimate(state: Expression, k: Expression)
+ extends BinaryExpression
+ with CodegenFallback
+ with ImplicitCastInputTypes {
+
+ def this(child: Expression, topK: Int) = this(child, Literal(topK))
+
+ def this(child: Expression) = this(child, Literal(ApproxTopK.DEFAULT_K))
+
+ private lazy val itemDataType: DataType = {
+ // itemDataType is the type of the second field of the output of ACCUMULATE or COMBINE
+ state.dataType.asInstanceOf[StructType](1).dataType
+ }
+
+ override def left: Expression = state
+
+ override def right: Expression = k
+
+ override def inputTypes: Seq[AbstractDataType] = Seq(StructType, IntegerType)
+
+ private def checkStateFieldAndType(state: Expression): TypeCheckResult = {
+ val stateStructType = state.dataType.asInstanceOf[StructType]
+ if (stateStructType.length != 3) {
+ return TypeCheckFailure("State must be a struct with 3 fields. " +
+ "Expected struct: struct. " +
+ "Got: " + state.dataType.simpleString)
+ }
+
+ if (stateStructType.head.dataType != BinaryType) {
+ TypeCheckFailure("State struct must have the first field to be binary. " +
+ "Got: " + stateStructType.head.dataType.simpleString)
+ } else if (!ApproxTopK.isDataTypeSupported(itemDataType)) {
+ TypeCheckFailure("State struct must have the second field to be a supported data type. " +
+ "Got: " + itemDataType.simpleString)
+ } else if (stateStructType(2).dataType != IntegerType) {
+ TypeCheckFailure("State struct must have the third field to be int. " +
+ "Got: " + stateStructType(2).dataType.simpleString)
+ } else {
+ TypeCheckSuccess
+ }
+ }
+
+
+ override def checkInputDataTypes(): TypeCheckResult = {
+ val defaultCheck = super.checkInputDataTypes()
+ if (defaultCheck.isFailure) {
+ defaultCheck
+ } else {
+ val stateCheck = checkStateFieldAndType(state)
+ if (stateCheck.isFailure) {
+ stateCheck
+ } else if (!k.foldable) {
+ TypeCheckFailure("K must be a constant literal")
+ } else {
+ TypeCheckSuccess
+ }
+ }
+ }
+
+ override def dataType: DataType = ApproxTopK.getResultDataType(itemDataType)
+
+ override def eval(input: InternalRow): Any = {
+ // null check
+ ApproxTopK.checkExpressionNotNull(k, "k")
+ // eval
+ val stateEval = left.eval(input)
+ val kEval = right.eval(input)
+ val dataSketchBytes = stateEval.asInstanceOf[InternalRow].getBinary(0)
+ val maxItemsTrackedVal = stateEval.asInstanceOf[InternalRow].getInt(2)
+ val kVal = kEval.asInstanceOf[Int]
+ ApproxTopK.checkK(kVal)
+ ApproxTopK.checkMaxItemsTracked(maxItemsTrackedVal, kVal)
+ val itemsSketch = ItemsSketch.getInstance(
+ Memory.wrap(dataSketchBytes), ApproxTopK.genSketchSerDe(itemDataType))
+ ApproxTopK.genEvalResult(itemsSketch, kVal, itemDataType)
+ }
+
+ override protected def withNewChildrenInternal(newState: Expression, newK: Expression)
+ : Expression = copy(state = newState, k = newK)
+
+ override def nullable: Boolean = false
+
+ override def prettyName: String =
+ getTagValue(FunctionRegistry.FUNC_ALIAS).getOrElse("approx_top_k_estimate")
+}
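
A minimal end-to-end sketch of the new SQL surface, assuming a Spark build that includes this patch and registers `approx_top_k_accumulate`/`approx_top_k_estimate`; the query follows the ExpressionDescription examples above.

```scala
import org.apache.spark.sql.SparkSession

// Build a sketch of the column with approx_top_k_accumulate, then ask for the top 2 items.
val spark = SparkSession.builder().master("local[1]").appName("approx-top-k-sketch").getOrCreate()
spark.sql(
  """SELECT approx_top_k_estimate(approx_top_k_accumulate(expr), 2)
    |FROM VALUES 'a', 'b', 'c', 'c', 'c', 'c', 'd', 'd' AS tab(expr)""".stripMargin
).show(truncate = false)
// Expected, per the docs above: [{"item":"c","count":4},{"item":"d","count":2}]
spark.stop()
```
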
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Cast.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Cast.scala
index 7a4145933fc7f..23610f97dbbd4 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Cast.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Cast.scala
@@ -115,6 +115,8 @@ object Cast extends QueryErrorsBase {
case (_: AnsiIntervalType, _: IntegralType | _: DecimalType) => true
case (_: IntegralType | _: DecimalType, _: AnsiIntervalType) => true
+ case (_: TimeType, _: DecimalType) => true
+
case (_: DayTimeIntervalType, _: DayTimeIntervalType) => true
case (_: YearMonthIntervalType, _: YearMonthIntervalType) => true
@@ -134,6 +136,9 @@ object Cast extends QueryErrorsBase {
// to convert data of these types to Variant Objects.
case (_, VariantType) => variant.VariantGet.checkDataType(from, allowStructsAndMaps = false)
+ case (_: TimeType, _: TimeType) => true
+ case (_: TimeType, _: IntegralType) => true
+
// non-null variants can generate nulls even in ANSI mode
case (ArrayType(fromType, fn), ArrayType(toType, tn)) =>
canAnsiCast(fromType, toType) && resolvableNullability(fn || (fromType == VariantType), tn)
@@ -228,6 +233,8 @@ object Cast extends QueryErrorsBase {
case (TimestampType, DateType) => true
case (TimestampNTZType, DateType) => true
+ case (_: TimeType, _: DecimalType) => true
+
case (_: StringType, CalendarIntervalType) => true
case (_: StringType, _: DayTimeIntervalType) => true
case (_: StringType, _: YearMonthIntervalType) => true
@@ -251,6 +258,9 @@ object Cast extends QueryErrorsBase {
// to convert data of these types to Variant Objects.
case (_, VariantType) => variant.VariantGet.checkDataType(from, allowStructsAndMaps = false)
+ case (_: TimeType, _: TimeType) => true
+ case (_: TimeType, _: IntegralType) => true
+
case (ArrayType(fromType, fn), ArrayType(toType, tn)) =>
canCast(fromType, toType) &&
resolvableNullability(fn || forceNullable(fromType, toType), tn)
@@ -366,6 +376,7 @@ object Cast extends QueryErrorsBase {
case (_, _: StringType) => false
case (TimestampType, ByteType | ShortType | IntegerType) => true
+ case (_: TimeType, ByteType | ShortType) => true
case (FloatType | DoubleType, TimestampType) => true
case (TimestampType, DateType) => false
case (_, DateType) => true
@@ -493,6 +504,10 @@ case class Cast(
final override def nodePatternsInternal(): Seq[TreePattern] = Seq(CAST)
+ override def contextIndependentFoldable: Boolean = {
+ child.contextIndependentFoldable && !Cast.needsTimeZone(child.dataType, dataType)
+ }
+
def ansiEnabled: Boolean = {
evalMode == EvalMode.ANSI || (evalMode == EvalMode.TRY && !canUseLegacyCastForTryCast)
}
@@ -716,6 +731,9 @@ case class Cast(
private[this] def timestampToDouble(ts: Long): Double = {
ts / MICROS_PER_SECOND.toDouble
}
+ private[this] def timeToLong(timeNanos: Long): Long = {
+ Math.floorDiv(timeNanos, NANOS_PER_SECOND)
+ }
// DateConverter
private[this] def castToDate(from: DataType): Any => Any = from match {
@@ -733,13 +751,15 @@ case class Cast(
buildCast[Long](_, t => microsToDays(t, ZoneOffset.UTC))
}
- private[this] def castToTime(from: DataType): Any => Any = from match {
+ private[this] def castToTime(from: DataType, to: TimeType): Any => Any = from match {
case _: StringType =>
if (ansiEnabled) {
buildCast[UTF8String](_, s => DateTimeUtils.stringToTimeAnsi(s, getContextOrNull()))
} else {
buildCast[UTF8String](_, s => DateTimeUtils.stringToTime(s).orNull)
}
+ case _: TimeType =>
+ buildCast[Long](_, nanos => DateTimeUtils.truncateTimeToPrecision(nanos, to.precision))
}
// IntervalConverter
@@ -801,6 +821,8 @@ case class Cast(
buildCast[Int](_, d => null)
case TimestampType =>
buildCast[Long](_, t => timestampToLong(t))
+ case _: TimeType =>
+ buildCast[Long](_, t => timeToLong(t))
case x: NumericType if ansiEnabled =>
val exactNumeric = PhysicalNumericType.exactNumeric(x)
b => exactNumeric.toLong(b)
@@ -841,6 +863,8 @@ case class Cast(
errorOrNull(t, from, IntegerType)
}
})
+ case _: TimeType =>
+ buildCast[Long](_, t => timeToLong(t).toInt)
case x: NumericType if ansiEnabled =>
val exactNumeric = PhysicalNumericType.exactNumeric(x)
b => exactNumeric.toInt(b)
@@ -877,6 +901,15 @@ case class Cast(
errorOrNull(t, from, ShortType)
}
})
+ case _: TimeType =>
+ buildCast[Long](_, t => {
+ val longValue = timeToLong(t)
+ if (longValue == longValue.toShort) {
+ longValue.toShort
+ } else {
+ errorOrNull(t, from, ShortType)
+ }
+ })
case x: NumericType if ansiEnabled =>
val exactNumeric = PhysicalNumericType.exactNumeric(x)
b =>
@@ -924,6 +957,15 @@ case class Cast(
errorOrNull(t, from, ByteType)
}
})
+ case _: TimeType =>
+ buildCast[Long](_, t => {
+ val longValue = timeToLong(t)
+ if (longValue == longValue.toByte) {
+ longValue.toByte
+ } else {
+ errorOrNull(t, from, ByteType)
+ }
+ })
case x: NumericType if ansiEnabled =>
val exactNumeric = PhysicalNumericType.exactNumeric(x)
b =>
@@ -1002,9 +1044,15 @@ case class Cast(
b => toPrecision(if (b) Decimal.ONE else Decimal.ZERO, target, getContextOrNull()))
case DateType =>
buildCast[Int](_, d => null) // date can't cast to decimal in Hive
- case TimestampType =>
- // Note that we lose precision here.
- buildCast[Long](_, t => changePrecision(Decimal(timestampToDouble(t)), target))
+ case TimestampType => buildCast[Long](_, t => changePrecision(
+ // 19 digits is enough to represent any TIMESTAMP value in Long.
+ // 6 digits of scale is for microseconds precision of TIMESTAMP values.
+ Decimal.apply(t, 19, 6), target))
+ case _: TimeType => buildCast[Long](_, t => changePrecision(
+ // 14 digits is enough to cover the full range of TIME value [0, 24:00) which is
+ // [0, 24 * 60 * 60 * 1000 * 1000 * 1000) = [0, 86400000000000).
+ // 9 digits of scale is for nanoseconds precision of TIME values.
+ Decimal.apply(t, precision = 14, scale = 9), target))
case dt: DecimalType =>
b => toPrecision(b.asInstanceOf[Decimal], target, getContextOrNull())
case t: IntegralType =>
@@ -1149,7 +1197,7 @@ case class Cast(
case s: StringType => castToString(from, s.constraint)
case BinaryType => castToBinary(from)
case DateType => castToDate(from)
- case _: TimeType => castToTime(from)
+ case it: TimeType => castToTime(from, it)
case decimal: DecimalType => castToDecimal(from, decimal)
case TimestampType => castToTimestamp(from)
case TimestampNTZType => castToTimestampNTZ(from)
@@ -1257,7 +1305,7 @@ case class Cast(
(c, evPrim, _) => castToStringCode(from, ctx, s.constraint).apply(c, evPrim)
case BinaryType => castToBinaryCode(from)
case DateType => castToDateCode(from, ctx)
- case _: TimeType => castToTimeCode(from, ctx)
+ case it: TimeType => castToTimeCode(from, it, ctx)
case decimal: DecimalType => castToDecimalCode(from, decimal, ctx)
case TimestampType => castToTimestampCode(from, ctx)
case TimestampNTZType => castToTimestampNTZCode(from, ctx)
@@ -1354,6 +1402,7 @@ case class Cast(
private[this] def castToTimeCode(
from: DataType,
+ to: TimeType,
ctx: CodegenContext): CastFunction = {
from match {
case _: StringType =>
@@ -1374,7 +1423,11 @@ case class Cast(
}
"""
}
-
+ case _: TimeType =>
+ (nanos, evPrim, _) =>
+ code"""
+ $evPrim = $dateTimeUtilsCls.truncateTimeToPrecision($nanos, ${to.precision});
+ """
case _ =>
(_, _, evNull) => code"$evNull = true;"
}
@@ -1458,11 +1511,15 @@ case class Cast(
// date can't cast to decimal in Hive
(c, evPrim, evNull) => code"$evNull = true;"
case TimestampType =>
- // Note that we lose precision here.
(c, evPrim, evNull) =>
code"""
- Decimal $tmp = Decimal.apply(
- scala.math.BigDecimal.valueOf(${timestampToDoubleCode(c)}));
+ Decimal $tmp = Decimal.apply($c, 19, 6);
+ ${changePrecision(tmp, target, evPrim, evNull, canNullSafeCast, ctx)}
+ """
+ case _: TimeType =>
+ (c, evPrim, evNull) =>
+ code"""
+ Decimal $tmp = Decimal.apply($c, 14, 9);
${changePrecision(tmp, target, evPrim, evNull, canNullSafeCast, ctx)}
"""
case DecimalType() =>
@@ -1712,6 +1769,9 @@ case class Cast(
private[this] def timestampToDoubleCode(ts: ExprValue): Block =
code"$ts / (double)$MICROS_PER_SECOND"
+ private[this] def timeToLongCode(timeValue: ExprValue): Block =
+ code"Math.floorDiv($timeValue, ${NANOS_PER_SECOND}L)"
+
private[this] def castToBooleanCode(
from: DataType,
ctx: CodegenContext): CastFunction = from match {
@@ -1771,6 +1831,33 @@ case class Cast(
"""
}
+ private[this] def castTimeToIntegralTypeCode(
+ ctx: CodegenContext,
+ integralType: String,
+ from: DataType,
+ to: DataType): CastFunction = {
+
+ val longValue = ctx.freshName("longValue")
+ val fromDt = ctx.addReferenceObj("from", from, from.getClass.getName)
+ val toDt = ctx.addReferenceObj("to", to, to.getClass.getName)
+
+ (c, evPrim, evNull) =>
+ val overflow = if (ansiEnabled) {
+ code"""throw QueryExecutionErrors.castingCauseOverflowError($c, $fromDt, $toDt);"""
+ } else {
+ code"$evNull = true;"
+ }
+
+ code"""
+ long $longValue = ${timeToLongCode(c)};
+ if ($longValue == ($integralType) $longValue) {
+ $evPrim = ($integralType) $longValue;
+ } else {
+ $overflow
+ }
+ """
+ }
+
private[this] def castDayTimeIntervalToIntegralTypeCode(
startField: Byte,
endField: Byte,
@@ -1877,6 +1964,7 @@ case class Cast(
case DateType =>
(c, evPrim, evNull) => code"$evNull = true;"
case TimestampType => castTimestampToIntegralTypeCode(ctx, "byte", from, ByteType)
+ case _: TimeType => castTimeToIntegralTypeCode(ctx, "byte", from, ByteType)
case DecimalType() => castDecimalToIntegralTypeCode("byte")
case ShortType | IntegerType | LongType if ansiEnabled =>
castIntegralTypeToIntegralTypeExactCode(ctx, "byte", from, ByteType)
@@ -1914,6 +2002,7 @@ case class Cast(
case DateType =>
(c, evPrim, evNull) => code"$evNull = true;"
case TimestampType => castTimestampToIntegralTypeCode(ctx, "short", from, ShortType)
+ case _: TimeType => castTimeToIntegralTypeCode(ctx, "short", from, ShortType)
case DecimalType() => castDecimalToIntegralTypeCode("short")
case IntegerType | LongType if ansiEnabled =>
castIntegralTypeToIntegralTypeExactCode(ctx, "short", from, ShortType)
@@ -1949,6 +2038,8 @@ case class Cast(
case DateType =>
(c, evPrim, evNull) => code"$evNull = true;"
case TimestampType => castTimestampToIntegralTypeCode(ctx, "int", from, IntegerType)
+ case _: TimeType =>
+ (c, evPrim, _) => code"$evPrim = (int) ${timeToLongCode(c)};"
case DecimalType() => castDecimalToIntegralTypeCode("int")
case LongType if ansiEnabled =>
castIntegralTypeToIntegralTypeExactCode(ctx, "int", from, IntegerType)
@@ -1985,6 +2076,8 @@ case class Cast(
(c, evPrim, evNull) => code"$evNull = true;"
case TimestampType =>
(c, evPrim, evNull) => code"$evPrim = (long) ${timestampToLongCode(c)};"
+ case _: TimeType =>
+ (c, evPrim, evNull) => code"$evPrim = (long) ${timeToLongCode(c)};"
case DecimalType() => castDecimalToIntegralTypeCode("long")
case FloatType | DoubleType if ansiEnabled =>
castFractionToIntegralTypeCode(ctx, "long", from, LongType)
@@ -2221,6 +2314,10 @@ case class UpCast(child: Expression, target: AbstractDataType, walkedTypePath: S
case _ => target.asInstanceOf[DataType]
}
+ override def contextIndependentFoldable: Boolean = {
+ child.contextIndependentFoldable && !Cast.needsTimeZone(child.dataType, dataType)
+ }
+
override protected def withNewChildInternal(newChild: Expression): UpCast = copy(child = newChild)
}
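
The TIME-related additions above map a TIME value, stored as nanoseconds since midnight, to whole seconds for integral targets (`Math.floorDiv(nanos, NANOS_PER_SECOND)`) and to an unscaled decimal with precision 14 and scale 9 for decimal targets. A small standalone sketch of that arithmetic (not calling `Cast` itself; the constant below mirrors `NANOS_PER_SECOND`):

```scala
// Assumed constant: one second in nanoseconds.
val NanosPerSecond = 1000000000L

// Integral cast semantics: keep whole seconds since midnight.
def timeToLong(timeNanos: Long): Long = Math.floorDiv(timeNanos, NanosPerSecond)

// 10:30:00.123456789 expressed in nanoseconds since midnight.
val time = (10L * 3600 + 30 * 60) * NanosPerSecond + 123456789L

assert(timeToLong(time) == 37800L) // cast to an integral type drops the fractional second
// Decimal cast semantics: Decimal(time, precision = 14, scale = 9) keeps nanosecond precision.
assert(BigDecimal(time) / BigDecimal(NanosPerSecond) == BigDecimal("37800.123456789"))
```
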
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExprUtils.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExprUtils.scala
index 8b7d641828ba1..783de160f83b6 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExprUtils.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExprUtils.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.catalyst.expressions
import java.text.{DecimalFormat, DecimalFormatSymbols, ParsePosition}
import java.util.Locale
-import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.analysis._
import org.apache.spark.sql.catalyst.analysis.TypeCheckResult
import org.apache.spark.sql.catalyst.analysis.TypeCheckResult.{DataTypeMismatch, TypeCheckSuccess}
@@ -209,17 +208,6 @@ object ExprUtils extends EvalHelper with QueryErrorsBase {
"sqlExpr" -> toSQLExpr(expr),
"dataType" -> toSQLType(expr.dataType)))
}
-
- if (!expr.deterministic) {
- // This is just a sanity check, our analysis rule PullOutNondeterministic should
- // already pull out those nondeterministic expressions and evaluate them in
- // a Project node.
- throw SparkException.internalError(
- msg = s"Non-deterministic expression '${toSQLExpr(expr)}' should not appear in " +
- "grouping expression.",
- context = expr.origin.getQueryContext,
- summary = expr.origin.context.summary)
- }
}
a.groupingExpressions.foreach(checkValidGroupingExprs)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Expression.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Expression.scala
index cfdad6e9a51fe..f706741fc98ce 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Expression.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/Expression.scala
@@ -103,6 +103,18 @@ abstract class Expression extends TreeNode[Expression] {
*/
def foldable: Boolean = false
+ /**
+ * Returns true if the expression can be folded without relying on external context,
+ * such as current time zone, session configurations, or catalogs.
+ *
+ * When an expression is context-independent foldable, it can be safely evaluated during DDL
+ * operations like creating tables, views, or constraints. This allows systems to store the
+ * computed value rather than the expression itself, improving both simplicity and performance.
+ *
+ * Default is false to ensure explicit marking of context independence.
+ */
+ def contextIndependentFoldable: Boolean = false
+
/**
* Returns true when the current expression always return the same result for fixed inputs from
* children. The non-deterministic expressions should not change in number and order. They should
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExpressionSet.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExpressionSet.scala
index cc6fea2f1b7f1..0c4395d98475f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExpressionSet.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ExpressionSet.scala
@@ -20,7 +20,7 @@ package org.apache.spark.sql.catalyst.expressions
import scala.collection.mutable
import scala.collection.mutable.ArrayBuffer
-import org.apache.spark.sql.catalyst.util.SparkStringUtils
+import org.apache.spark.util.SparkStringUtils
object ExpressionSet {
/**
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/InterpretedUnsafeProjection.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/InterpretedUnsafeProjection.scala
index 46e92e0f38e23..004cd576ace03 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/InterpretedUnsafeProjection.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/InterpretedUnsafeProjection.scala
@@ -268,7 +268,7 @@ object InterpretedUnsafeProjection {
writer.setNull2Bytes(i)
}
}
- case IntegerType | DateType | FloatType =>
+ case IntegerType | DateType | FloatType | _: YearMonthIntervalType =>
(v, i) => {
if (!v.isNullAt(i)) {
unsafeWriter(v, i)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/PythonUDF.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/PythonUDF.scala
index 287f044a81610..e4d0f9642773e 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/PythonUDF.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/PythonUDF.scala
@@ -46,7 +46,8 @@ object PythonUDF {
}
def isWindowPandasUDF(e: PythonFuncExpression): Boolean = {
- // This is currently only `PythonUDAF` (which means SQL_GROUPED_AGG_PANDAS_UDF), but we might
+ // This is currently only `PythonUDAF` (which means SQL_GROUPED_AGG_PANDAS_UDF or
+ // SQL_GROUPED_AGG_ARROW_UDF), but we might
// support new types in the future, e.g., N -> N transform.
e.isInstanceOf[PythonUDAF]
}
@@ -120,11 +121,10 @@ case class PythonUDAF(
dataType: DataType,
children: Seq[Expression],
udfDeterministic: Boolean,
+ evalType: Int = PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF,
resultId: ExprId = NamedExpression.newExprId)
extends UnevaluableAggregateFunc with PythonFuncExpression {
- override def evalType: Int = PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF
-
override def sql(isDistinct: Boolean): String = {
val distinct = if (isDistinct) "DISTINCT " else ""
s"$name($distinct${children.mkString(", ")})"
@@ -176,6 +176,7 @@ abstract class UnevaluableGenerator extends Generator {
* @param pythonUDTFPartitionColumnIndexes holds the zero-based indexes of the projected results of
* all PARTITION BY expressions within the TABLE argument of
* the Python UDTF call, if applicable
+ * @param tableArguments holds, for each input argument, whether it is a table argument
*/
case class PythonUDTF(
name: String,
@@ -186,7 +187,8 @@ case class PythonUDTF(
evalType: Int,
udfDeterministic: Boolean,
resultId: ExprId = NamedExpression.newExprId,
- pythonUDTFPartitionColumnIndexes: Option[PythonUDTFPartitionColumnIndexes] = None)
+ pythonUDTFPartitionColumnIndexes: Option[PythonUDTFPartitionColumnIndexes] = None,
+ tableArguments: Option[Seq[Boolean]] = None)
extends UnevaluableGenerator with PythonFuncExpression {
override lazy val canonicalized: Expression = {
@@ -215,7 +217,8 @@ case class UnresolvedPolymorphicPythonUDTF(
evalType: Int,
udfDeterministic: Boolean,
resolveElementMetadata: (PythonFunction, Seq[Expression]) => PythonUDTFAnalyzeResult,
- resultId: ExprId = NamedExpression.newExprId)
+ resultId: ExprId = NamedExpression.newExprId,
+ tableArguments: Option[Seq[Boolean]] = None)
extends UnevaluableGenerator with PythonFuncExpression {
override lazy val resolved = false
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SemiStructuredExtract.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SemiStructuredExtract.scala
new file mode 100644
index 0000000000000..af5d2ec39d00e
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SemiStructuredExtract.scala
@@ -0,0 +1,60 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.expressions
+
+import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.catalyst.expressions.variant.VariantGet
+import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
+import org.apache.spark.sql.catalyst.rules.Rule
+import org.apache.spark.sql.catalyst.trees.TreePattern.{SEMI_STRUCTURED_EXTRACT, TreePattern}
+import org.apache.spark.sql.types.{DataType, StringType, VariantType}
+import org.apache.spark.unsafe.types.UTF8String
+
+/**
+ * Represents the extraction of data from a field that contains semi-structured data. The
+ * semi-structured column can only be a Variant type for now.
+ * @param child The semi-structured column
+ * @param field The field to extract
+ */
+case class SemiStructuredExtract(
+ child: Expression, field: String) extends UnaryExpression with Unevaluable {
+ override lazy val resolved = false
+ override def dataType: DataType = StringType
+
+ final override val nodePatterns: Seq[TreePattern] = Seq(SEMI_STRUCTURED_EXTRACT)
+
+ override protected def withNewChildInternal(newChild: Expression): SemiStructuredExtract =
+ copy(child = newChild)
+}
+
+/**
+ * Replaces SemiStructuredExtract expressions by extracting the specified field from the
+ * semi-structured column (only VariantType is supported for now).
+ */
+case object ExtractSemiStructuredFields extends Rule[LogicalPlan] {
+ override def apply(plan: LogicalPlan): LogicalPlan = plan.resolveExpressionsWithPruning(
+ _.containsPattern(SEMI_STRUCTURED_EXTRACT), ruleId) {
+ case SemiStructuredExtract(column, field) if column.resolved =>
+ if (column.dataType.isInstanceOf[VariantType]) {
+ VariantGet(column, Literal(UTF8String.fromString(field)), VariantType, failOnError = true)
+ } else {
+ throw new AnalysisException(
+ errorClass = "COLUMN_IS_NOT_VARIANT_TYPE", messageParameters = Map.empty)
+ }
+ }
+}
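
A hedged sketch of the rewrite performed by `ExtractSemiStructuredFields`: a resolved variant-typed column wrapped in `SemiStructuredExtract` becomes a `VariantGet` on the requested field. The attribute name and field path below are illustrative only.

```scala
import org.apache.spark.sql.catalyst.expressions.{AttributeReference, Literal, SemiStructuredExtract}
import org.apache.spark.sql.catalyst.expressions.variant.VariantGet
import org.apache.spark.sql.types.VariantType
import org.apache.spark.unsafe.types.UTF8String

// A resolved variant column, as the rule requires (column.resolved).
val payload = AttributeReference("payload", VariantType)()

// What the analyzer sees before the rule runs.
val before = SemiStructuredExtract(payload, "$.user.name")

// What the rule rewrites it to: an error-on-failure variant field extraction.
val after = VariantGet(
  payload, Literal(UTF8String.fromString("$.user.name")), VariantType, failOnError = true)
```
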
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SpecificInternalRow.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SpecificInternalRow.scala
index 971cfcae8e478..1f755df0516ff 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SpecificInternalRow.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/SpecificInternalRow.scala
@@ -17,6 +17,8 @@
package org.apache.spark.sql.catalyst.expressions
+import scala.annotation.tailrec
+
import org.apache.spark.sql.types._
/**
@@ -192,6 +194,7 @@ final class MutableAny extends MutableValue {
*/
final class SpecificInternalRow(val values: Array[MutableValue]) extends BaseGenericInternalRow {
+ @tailrec
private[this] def dataTypeToMutableValue(dataType: DataType): MutableValue = dataType match {
// We use INT for DATE and YearMonthIntervalType internally
case IntegerType | DateType | _: YearMonthIntervalType => new MutableInt
@@ -203,6 +206,7 @@ final class SpecificInternalRow(val values: Array[MutableValue]) extends BaseGen
case BooleanType => new MutableBoolean
case ByteType => new MutableByte
case ShortType => new MutableShort
+ case udt: UserDefinedType[_] => dataTypeToMutableValue(udt.sqlType)
case _ => new MutableAny
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ToStringBase.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ToStringBase.scala
index 2e649763a9ac9..bc294fd722b3e 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ToStringBase.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ToStringBase.scala
@@ -22,7 +22,7 @@ import java.time.ZoneOffset
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.codegen._
import org.apache.spark.sql.catalyst.expressions.codegen.Block._
-import org.apache.spark.sql.catalyst.util.{ArrayData, CharVarcharCodegenUtils, DateFormatter, FractionTimeFormatter, IntervalStringStyles, IntervalUtils, MapData, SparkStringUtils, TimestampFormatter}
+import org.apache.spark.sql.catalyst.util.{ArrayData, CharVarcharCodegenUtils, DateFormatter, FractionTimeFormatter, IntervalStringStyles, IntervalUtils, MapData, TimestampFormatter}
import org.apache.spark.sql.catalyst.util.IntervalStringStyles.ANSI_STYLE
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.SQLConf.BinaryOutputStyle
@@ -30,6 +30,7 @@ import org.apache.spark.sql.types._
import org.apache.spark.unsafe.UTF8StringBuilder
import org.apache.spark.unsafe.types.{CalendarInterval, UTF8String}
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.SparkStringUtils
trait ToStringBase { self: UnaryExpression with TimeZoneAwareExpression =>
@@ -165,7 +166,7 @@ trait ToStringBase { self: UnaryExpression with TimeZoneAwareExpression =>
})
case pudt: PythonUserDefinedType => castToString(pudt.sqlType)
case udt: UserDefinedType[_] =>
- o => UTF8String.fromString(udt.deserialize(o).toString)
+ o => UTF8String.fromString(udt.stringifyValue(udt.deserialize(o)))
case YearMonthIntervalType(startField, endField) =>
acceptAny[Int](i => UTF8String.fromString(
IntervalUtils.toYearMonthIntervalString(i, ANSI_STYLE, startField, endField)))
@@ -274,7 +275,7 @@ trait ToStringBase { self: UnaryExpression with TimeZoneAwareExpression =>
case udt: UserDefinedType[_] =>
val udtRef = JavaCode.global(ctx.addReferenceObj("udt", udt), udt.sqlType)
(c, evPrim) =>
- code"$evPrim = UTF8String.fromString($udtRef.deserialize($c).toString());"
+ code"$evPrim = UTF8String.fromString($udtRef.stringifyValue($udtRef.deserialize($c)));"
case i: YearMonthIntervalType =>
val iu = IntervalUtils.getClass.getName.stripSuffix("$")
val iss = IntervalStringStyles.getClass.getName.stripSuffix("$")
@@ -471,7 +472,24 @@ object ToStringBase {
(array: Array[Byte]) => UTF8String.fromString(SparkStringUtils.getHexString(array))
}
}
+
+ def getBinaryParser: BinaryParser = {
+ val style = SQLConf.get.getConf(SQLConf.BINARY_OUTPUT_STYLE)
+ style match {
+ case Some(BinaryOutputStyle.UTF8) =>
+ (utf8: UTF8String) => utf8.getBytes
+ case Some(BinaryOutputStyle.BASIC) =>
+ (utf8: UTF8String) =>
+ utf8.toString.stripPrefix("[").stripSuffix("]").split(",").map(_.trim.toByte)
+ case Some(BinaryOutputStyle.BASE64) =>
+ (utf8: UTF8String) => java.util.Base64.getDecoder.decode(utf8.getBytes)
+ case Some(BinaryOutputStyle.HEX) =>
+ (utf8: UTF8String) => Hex.unhex(utf8.getBytes)
+ case _ =>
+ (utf8: UTF8String) => SparkStringUtils.fromHexString(utf8.toString)
+ }
+ }
}
trait BinaryFormatter extends (Array[Byte] => UTF8String) with Serializable
-
+trait BinaryParser extends (UTF8String => Array[Byte]) with Serializable
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/V2ExpressionUtils.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/V2ExpressionUtils.scala
index 7cc03f3ac3fa6..fd3d1daae6742 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/V2ExpressionUtils.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/V2ExpressionUtils.scala
@@ -19,7 +19,7 @@ package org.apache.spark.sql.catalyst.expressions
import java.lang.reflect.{Method, Modifier}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{FUNCTION_NAME, FUNCTION_PARAM}
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.{InternalRow, SQLConfHelper}
@@ -243,6 +243,7 @@ object V2ExpressionUtils extends SQLConfHelper with Logging {
case "ENDS_WITH" => convertBinaryExpr(expr, EndsWith)
case "CONTAINS" => convertBinaryExpr(expr, Contains)
case "IN" => convertExpr(expr, children => In(children.head, children.tail))
+ case "BOOLEAN_EXPRESSION" => toCatalyst(expr.children().head)
case _ => None
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/aggregate/ApproxTopKAggregates.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/aggregate/ApproxTopKAggregates.scala
new file mode 100644
index 0000000000000..cefe0a14dee56
--- /dev/null
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/aggregate/ApproxTopKAggregates.scala
@@ -0,0 +1,437 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.catalyst.expressions.aggregate
+
+import org.apache.datasketches.common._
+import org.apache.datasketches.frequencies.{ErrorType, ItemsSketch}
+import org.apache.datasketches.memory.Memory
+
+import org.apache.spark.sql.catalyst.InternalRow
+import org.apache.spark.sql.catalyst.analysis.{FunctionRegistry, TypeCheckResult}
+import org.apache.spark.sql.catalyst.analysis.TypeCheckResult.{TypeCheckFailure, TypeCheckSuccess}
+import org.apache.spark.sql.catalyst.expressions.{ArrayOfDecimalsSerDe, Expression, ExpressionDescription, ImplicitCastInputTypes, Literal}
+import org.apache.spark.sql.catalyst.trees.{BinaryLike, TernaryLike}
+import org.apache.spark.sql.catalyst.util.{CollationFactory, GenericArrayData}
+import org.apache.spark.sql.errors.QueryExecutionErrors
+import org.apache.spark.sql.types._
+import org.apache.spark.unsafe.types.UTF8String
+
+/**
+ * The ApproxTopK function (i.e., "approx_top_k") is an aggregate function that estimates
+ * the approximate top K (aka. k-most-frequent) items in a column.
+ *
+ * The result is an array of structs, each containing a frequent item and its estimated frequency.
+ * The items are sorted by their estimated frequency in descending order.
+ *
+ * The function uses the ItemsSketch from the DataSketches library to do the estimation.
+ *
+ * See [[https://datasketches.apache.org/docs/Frequency/FrequencySketches.html]]
+ * for more information.
+ *
+ * @param expr the child expression to estimate the top K items from
+ * @param k the number of top items to return (K)
+ * @param maxItemsTracked the maximum number of items to track in the sketch
+ * @param mutableAggBufferOffset the offset for mutable aggregation buffer
+ * @param inputAggBufferOffset the offset for input aggregation buffer
+ */
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(expr, k, maxItemsTracked) - Returns top k items with their frequency.
+ `k` An optional INTEGER literal greater than 0. If k is not specified, it defaults to 5.
+ `maxItemsTracked` An optional INTEGER literal greater than or equal to k, with an upper limit of 1000000. If maxItemsTracked is not specified, it defaults to 10000.
+ """,
+ examples = """
+ Examples:
+ > SELECT _FUNC_(expr) FROM VALUES (0), (0), (1), (1), (2), (3), (4), (4) AS tab(expr);
+ [{"item":0,"count":2},{"item":4,"count":2},{"item":1,"count":2},{"item":2,"count":1},{"item":3,"count":1}]
+
+ > SELECT _FUNC_(expr, 2) FROM VALUES 'a', 'b', 'c', 'c', 'c', 'c', 'd', 'd' AS tab(expr);
+ [{"item":"c","count":4},{"item":"d","count":2}]
+
+ > SELECT _FUNC_(expr, 10, 100) FROM VALUES (0), (1), (1), (2), (2), (2) AS tab(expr);
+ [{"item":2,"count":3},{"item":1,"count":2},{"item":0,"count":1}]
+ """,
+ group = "agg_funcs",
+ since = "4.1.0")
+// scalastyle:on line.size.limit
+case class ApproxTopK(
+ expr: Expression,
+ k: Expression,
+ maxItemsTracked: Expression,
+ mutableAggBufferOffset: Int = 0,
+ inputAggBufferOffset: Int = 0)
+ extends TypedImperativeAggregate[ItemsSketch[Any]]
+ with ImplicitCastInputTypes
+ with TernaryLike[Expression] {
+
+ def this(child: Expression, topK: Expression, maxItemsTracked: Expression) =
+ this(child, topK, maxItemsTracked, 0, 0)
+
+ def this(child: Expression, topK: Int, maxItemsTracked: Int) =
+ this(child, Literal(topK), Literal(maxItemsTracked), 0, 0)
+
+ def this(child: Expression, topK: Expression) =
+ this(child, topK, Literal(ApproxTopK.DEFAULT_MAX_ITEMS_TRACKED), 0, 0)
+
+ def this(child: Expression, topK: Int) =
+ this(child, Literal(topK), Literal(ApproxTopK.DEFAULT_MAX_ITEMS_TRACKED), 0, 0)
+
+ def this(child: Expression) =
+ this(child, Literal(ApproxTopK.DEFAULT_K), Literal(ApproxTopK.DEFAULT_MAX_ITEMS_TRACKED), 0, 0)
+
+ private lazy val itemDataType: DataType = expr.dataType
+ private lazy val kVal: Int = {
+ ApproxTopK.checkExpressionNotNull(k, "k")
+ val kVal = k.eval().asInstanceOf[Int]
+ ApproxTopK.checkK(kVal)
+ kVal
+ }
+ private lazy val maxItemsTrackedVal: Int = {
+ ApproxTopK.checkExpressionNotNull(maxItemsTracked, "maxItemsTracked")
+ val maxItemsTrackedVal = maxItemsTracked.eval().asInstanceOf[Int]
+ ApproxTopK.checkMaxItemsTracked(maxItemsTrackedVal, kVal)
+ maxItemsTrackedVal
+ }
+
+ override def first: Expression = expr
+
+ override def second: Expression = k
+
+ override def third: Expression = maxItemsTracked
+
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyDataType, IntegerType, IntegerType)
+
+ override def checkInputDataTypes(): TypeCheckResult = {
+ val defaultCheck = super.checkInputDataTypes()
+ if (defaultCheck.isFailure) {
+ defaultCheck
+ } else if (!ApproxTopK.isDataTypeSupported(itemDataType)) {
+ TypeCheckFailure(s"${itemDataType.typeName} columns are not supported")
+ } else if (!k.foldable) {
+ TypeCheckFailure("K must be a constant literal")
+ } else if (!maxItemsTracked.foldable) {
+ TypeCheckFailure("Number of items tracked must be a constant literal")
+ } else {
+ TypeCheckSuccess
+ }
+ }
+
+ override def dataType: DataType = ApproxTopK.getResultDataType(itemDataType)
+
+ override def createAggregationBuffer(): ItemsSketch[Any] = {
+ val maxMapSize = ApproxTopK.calMaxMapSize(maxItemsTrackedVal)
+ ApproxTopK.createAggregationBuffer(expr, maxMapSize)
+ }
+
+ override def update(buffer: ItemsSketch[Any], input: InternalRow): ItemsSketch[Any] =
+ ApproxTopK.updateSketchBuffer(expr, buffer, input)
+
+ override def merge(buffer: ItemsSketch[Any], input: ItemsSketch[Any]): ItemsSketch[Any] =
+ buffer.merge(input)
+
+ override def eval(buffer: ItemsSketch[Any]): GenericArrayData =
+ ApproxTopK.genEvalResult(buffer, kVal, itemDataType)
+
+ override def serialize(buffer: ItemsSketch[Any]): Array[Byte] =
+ buffer.toByteArray(ApproxTopK.genSketchSerDe(itemDataType))
+
+ override def deserialize(storageFormat: Array[Byte]): ItemsSketch[Any] =
+ ItemsSketch.getInstance(Memory.wrap(storageFormat), ApproxTopK.genSketchSerDe(itemDataType))
+
+ override def withNewMutableAggBufferOffset(newMutableAggBufferOffset: Int): ImperativeAggregate =
+ copy(mutableAggBufferOffset = newMutableAggBufferOffset)
+
+ override def withNewInputAggBufferOffset(newInputAggBufferOffset: Int): ImperativeAggregate =
+ copy(inputAggBufferOffset = newInputAggBufferOffset)
+
+ override protected def withNewChildrenInternal(
+ newExpr: Expression,
+ newK: Expression,
+ newMaxItemsTracked: Expression): Expression =
+ copy(expr = newExpr, k = newK, maxItemsTracked = newMaxItemsTracked)
+
+ override def nullable: Boolean = false
+
+ override def prettyName: String =
+ getTagValue(FunctionRegistry.FUNC_ALIAS).getOrElse("approx_top_k")
+}
+
+object ApproxTopK {
+
+ val DEFAULT_K: Int = 5
+ val DEFAULT_MAX_ITEMS_TRACKED: Int = 10000
+ private val MAX_ITEMS_TRACKED_LIMIT: Int = 1000000
+
+ def checkExpressionNotNull(expr: Expression, exprName: String): Unit = {
+ if (expr == null || expr.eval() == null) {
+ throw QueryExecutionErrors.approxTopKNullArg(exprName)
+ }
+ }
+
+ def checkK(k: Int): Unit = {
+ if (k <= 0) {
+ throw QueryExecutionErrors.approxTopKNonPositiveValue("k", k)
+ }
+ }
+
+ def checkMaxItemsTracked(maxItemsTracked: Int): Unit = {
+ if (maxItemsTracked > MAX_ITEMS_TRACKED_LIMIT) {
+ throw QueryExecutionErrors.approxTopKMaxItemsTrackedExceedsLimit(
+ maxItemsTracked, MAX_ITEMS_TRACKED_LIMIT)
+ }
+ if (maxItemsTracked <= 0) {
+ throw QueryExecutionErrors.approxTopKNonPositiveValue("maxItemsTracked", maxItemsTracked)
+ }
+ }
+
+ def checkMaxItemsTracked(maxItemsTracked: Int, k: Int): Unit = {
+ checkMaxItemsTracked(maxItemsTracked)
+ if (maxItemsTracked < k) {
+ throw QueryExecutionErrors.approxTopKMaxItemsTrackedLessThanK(maxItemsTracked, k)
+ }
+ }
+
+ def getResultDataType(itemDataType: DataType): DataType = {
+ val resultEntryType = StructType(
+ StructField("item", itemDataType, nullable = false) ::
+ StructField("count", LongType, nullable = false) :: Nil)
+ ArrayType(resultEntryType, containsNull = false)
+ }
+
+ def isDataTypeSupported(itemType: DataType): Boolean = {
+ itemType match {
+ case _: BooleanType | _: ByteType | _: ShortType | _: IntegerType |
+ _: LongType | _: FloatType | _: DoubleType | _: DateType |
+ _: TimestampType | _: TimestampNTZType | _: StringType | _: DecimalType => true
+ // BinaryType is not supported for now, as ItemsSketch does not appear to count its frequencies correctly
+ case _ => false
+ }
+ }
+
+ def calMaxMapSize(maxItemsTracked: Int): Int = {
+ // The maximum capacity of the internal hash map is maxMapCap = 0.75 * maxMapSize
+ // Therefore, the maxMapSize must be at least ceil(maxItemsTracked / 0.75)
+ // https://datasketches.apache.org/docs/Frequency/FrequentItemsOverview.html
+ val ceilMaxMapSize = math.ceil(maxItemsTracked / 0.75).toInt
+ // The maxMapSize must be a power of 2 that is at least ceilMaxMapSize
+ math.pow(2, math.ceil(math.log(ceilMaxMapSize) / math.log(2))).toInt
+ }
+
+ def createAggregationBuffer(itemExpression: Expression, maxMapSize: Int): ItemsSketch[Any] = {
+ itemExpression.dataType match {
+ case _: BooleanType =>
+ new ItemsSketch[Boolean](maxMapSize).asInstanceOf[ItemsSketch[Any]]
+ case _: ByteType | _: ShortType | _: IntegerType | _: FloatType | _: DateType =>
+ new ItemsSketch[Number](maxMapSize).asInstanceOf[ItemsSketch[Any]]
+ case _: LongType | _: TimestampType | _: TimestampNTZType =>
+ new ItemsSketch[Long](maxMapSize).asInstanceOf[ItemsSketch[Any]]
+ case _: DoubleType =>
+ new ItemsSketch[Double](maxMapSize).asInstanceOf[ItemsSketch[Any]]
+ case _: StringType =>
+ new ItemsSketch[String](maxMapSize).asInstanceOf[ItemsSketch[Any]]
+ case _: DecimalType =>
+ new ItemsSketch[Decimal](maxMapSize).asInstanceOf[ItemsSketch[Any]]
+ }
+ }
+
+ def updateSketchBuffer(
+ itemExpression: Expression,
+ buffer: ItemsSketch[Any],
+ input: InternalRow): ItemsSketch[Any] = {
+ val v = itemExpression.eval(input)
+ if (v != null) {
+ itemExpression.dataType match {
+ case _: BooleanType => buffer.update(v.asInstanceOf[Boolean])
+ case _: ByteType => buffer.update(v.asInstanceOf[Byte])
+ case _: ShortType => buffer.update(v.asInstanceOf[Short])
+ case _: IntegerType => buffer.update(v.asInstanceOf[Int])
+ case _: LongType => buffer.update(v.asInstanceOf[Long])
+ case _: FloatType => buffer.update(v.asInstanceOf[Float])
+ case _: DoubleType => buffer.update(v.asInstanceOf[Double])
+ case _: DateType => buffer.update(v.asInstanceOf[Int])
+ case _: TimestampType => buffer.update(v.asInstanceOf[Long])
+ case _: TimestampNTZType => buffer.update(v.asInstanceOf[Long])
+ case st: StringType =>
+ val cKey = CollationFactory.getCollationKey(v.asInstanceOf[UTF8String], st.collationId)
+ buffer.update(cKey.toString)
+ case _: DecimalType => buffer.update(v.asInstanceOf[Decimal])
+ }
+ }
+ buffer
+ }
+
+ def genEvalResult(
+ itemsSketch: ItemsSketch[Any],
+ k: Int,
+ itemDataType: DataType): GenericArrayData = {
+ val items = itemsSketch.getFrequentItems(ErrorType.NO_FALSE_POSITIVES)
+ val resultLength = math.min(items.length, k)
+ val result = new Array[AnyRef](resultLength)
+ for (i <- 0 until resultLength) {
+ val row = items(i)
+ itemDataType match {
+ case _: BooleanType | _: ByteType | _: ShortType | _: IntegerType |
+ _: LongType | _: FloatType | _: DoubleType | _: DecimalType |
+ _: DateType | _: TimestampType | _: TimestampNTZType =>
+ result(i) = InternalRow.apply(row.getItem, row.getEstimate)
+ case _: StringType =>
+ val item = UTF8String.fromString(row.getItem.asInstanceOf[String])
+ result(i) = InternalRow.apply(item, row.getEstimate)
+ }
+ }
+ new GenericArrayData(result)
+ }
+
+ def genSketchSerDe(dataType: DataType): ArrayOfItemsSerDe[Any] = {
+ dataType match {
+ case _: BooleanType => new ArrayOfBooleansSerDe().asInstanceOf[ArrayOfItemsSerDe[Any]]
+ case _: ByteType | _: ShortType | _: IntegerType | _: FloatType | _: DateType =>
+ new ArrayOfNumbersSerDe().asInstanceOf[ArrayOfItemsSerDe[Any]]
+ case _: LongType | _: TimestampType | _: TimestampNTZType =>
+ new ArrayOfLongsSerDe().asInstanceOf[ArrayOfItemsSerDe[Any]]
+ case _: DoubleType =>
+ new ArrayOfDoublesSerDe().asInstanceOf[ArrayOfItemsSerDe[Any]]
+ case _: StringType =>
+ new ArrayOfStringsSerDe().asInstanceOf[ArrayOfItemsSerDe[Any]]
+ case dt: DecimalType =>
+ new ArrayOfDecimalsSerDe(dt).asInstanceOf[ArrayOfItemsSerDe[Any]]
+ }
+ }
+
+ def getSketchStateDataType(itemDataType: DataType): StructType =
+ StructType(
+ StructField("sketch", BinaryType, nullable = false) ::
+ StructField("itemDataType", itemDataType) ::
+ StructField("maxItemsTracked", IntegerType, nullable = false) :: Nil)
+}
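As a quick sanity check of the sizing rule documented in calMaxMapSize, the standalone sketch below (not part of the patch; the sample inputs are arbitrary) replays the same arithmetic:

// Standalone replay of the calMaxMapSize arithmetic above (sample inputs are arbitrary).
def calMaxMapSize(maxItemsTracked: Int): Int = {
  val ceilMaxMapSize = math.ceil(maxItemsTracked / 0.75).toInt
  math.pow(2, math.ceil(math.log(ceilMaxMapSize) / math.log(2))).toInt
}
calMaxMapSize(10000)  // ceil(10000 / 0.75) = 13334, rounded up to the next power of two: 16384
calMaxMapSize(100)    // ceil(100 / 0.75) = 134, rounded up to the next power of two: 256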
+
+/**
+ * An aggregate function that accumulates items into a sketch, which can then be used
+ * to combine with other sketches, via ApproxTopKCombine,
+ * or to estimate the top K items, via ApproxTopKEstimate.
+ *
+ * The output of this function is a struct containing the sketch in binary format,
+ * a null placeholder whose field type records the data type of the items in the sketch,
+ * and the maximum number of items tracked by the sketch.
+ *
+ * @param expr the child expression to accumulate items from
+ * @param maxItemsTracked the maximum number of items to track in the sketch
+ * @param mutableAggBufferOffset the offset for mutable aggregation buffer
+ * @param inputAggBufferOffset the offset for input aggregation buffer
+ */
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(expr, maxItemsTracked) - Accumulates items into a sketch.
+ `maxItemsTracked` An optional positive INTEGER literal with an upper limit of 1000000. If maxItemsTracked is not specified, it defaults to 10000.
+ """,
+ examples = """
+ Examples:
+ > SELECT approx_top_k_estimate(_FUNC_(expr)) FROM VALUES (0), (0), (1), (1), (2), (3), (4), (4) AS tab(expr);
+ [{"item":0,"count":2},{"item":4,"count":2},{"item":1,"count":2},{"item":2,"count":1},{"item":3,"count":1}]
+
+ > SELECT approx_top_k_estimate(_FUNC_(expr, 100), 2) FROM VALUES 'a', 'b', 'c', 'c', 'c', 'c', 'd', 'd' AS tab(expr);
+ [{"item":"c","count":4},{"item":"d","count":2}]
+ """,
+ group = "agg_funcs",
+ since = "4.1.0")
+// scalastyle:on line.size.limit
+case class ApproxTopKAccumulate(
+ expr: Expression,
+ maxItemsTracked: Expression,
+ mutableAggBufferOffset: Int = 0,
+ inputAggBufferOffset: Int = 0)
+ extends TypedImperativeAggregate[ItemsSketch[Any]]
+ with ImplicitCastInputTypes
+ with BinaryLike[Expression] {
+
+ def this(child: Expression, maxItemsTracked: Expression) = this(child, maxItemsTracked, 0, 0)
+
+ def this(child: Expression, maxItemsTracked: Int) = this(child, Literal(maxItemsTracked), 0, 0)
+
+ def this(child: Expression) = this(child, Literal(ApproxTopK.DEFAULT_MAX_ITEMS_TRACKED), 0, 0)
+
+ private lazy val itemDataType: DataType = expr.dataType
+
+ private lazy val maxItemsTrackedVal: Int = {
+ ApproxTopK.checkExpressionNotNull(maxItemsTracked, "maxItemsTracked")
+ val maxItemsTrackedVal = maxItemsTracked.eval().asInstanceOf[Int]
+ ApproxTopK.checkMaxItemsTracked(maxItemsTrackedVal)
+ maxItemsTrackedVal
+ }
+
+ override def left: Expression = expr
+
+ override def right: Expression = maxItemsTracked
+
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyDataType, IntegerType)
+
+ override def checkInputDataTypes(): TypeCheckResult = {
+ val defaultCheck = super.checkInputDataTypes()
+ if (defaultCheck.isFailure) {
+ defaultCheck
+ } else if (!ApproxTopK.isDataTypeSupported(itemDataType)) {
+ TypeCheckFailure(s"${itemDataType.typeName} columns are not supported")
+ } else if (!maxItemsTracked.foldable) {
+ TypeCheckFailure("Number of items tracked must be a constant literal")
+ } else {
+ TypeCheckSuccess
+ }
+ }
+
+ override def dataType: DataType = ApproxTopK.getSketchStateDataType(itemDataType)
+
+ override def createAggregationBuffer(): ItemsSketch[Any] = {
+ val maxMapSize = ApproxTopK.calMaxMapSize(maxItemsTrackedVal)
+ ApproxTopK.createAggregationBuffer(expr, maxMapSize)
+ }
+
+ override def update(buffer: ItemsSketch[Any], input: InternalRow): ItemsSketch[Any] =
+ ApproxTopK.updateSketchBuffer(expr, buffer, input)
+
+ override def merge(buffer: ItemsSketch[Any], input: ItemsSketch[Any]): ItemsSketch[Any] =
+ buffer.merge(input)
+
+ override def eval(buffer: ItemsSketch[Any]): Any = {
+ val sketchBytes = serialize(buffer)
+ InternalRow.apply(sketchBytes, null, maxItemsTrackedVal)
+ }
+
+ override def serialize(buffer: ItemsSketch[Any]): Array[Byte] =
+ buffer.toByteArray(ApproxTopK.genSketchSerDe(itemDataType))
+
+ override def deserialize(storageFormat: Array[Byte]): ItemsSketch[Any] =
+ ItemsSketch.getInstance(Memory.wrap(storageFormat), ApproxTopK.genSketchSerDe(itemDataType))
+
+ override def withNewMutableAggBufferOffset(newMutableAggBufferOffset: Int): ImperativeAggregate =
+ copy(mutableAggBufferOffset = newMutableAggBufferOffset)
+
+ override def withNewInputAggBufferOffset(newInputAggBufferOffset: Int): ImperativeAggregate =
+ copy(inputAggBufferOffset = newInputAggBufferOffset)
+
+ override protected def withNewChildrenInternal(
+ newLeft: Expression,
+ newRight: Expression): Expression =
+ copy(expr = newLeft, maxItemsTracked = newRight)
+
+ override def nullable: Boolean = false
+
+ override def prettyName: String =
+ getTagValue(FunctionRegistry.FUNC_ALIAS).getOrElse("approx_top_k_accumulate")
+}
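For context on the DataSketches calls that both aggregates above delegate to, here is a minimal standalone sketch of the update/merge/estimate flow. It uses only ItemsSketch methods already referenced in this file; the sample data and the map size of 64 are illustrative only.

import org.apache.datasketches.frequencies.{ErrorType, ItemsSketch}

// Two partial sketches, as update() would build them per partition.
val left = new ItemsSketch[String](64)
Seq("a", "a", "b").foreach(x => left.update(x))
val right = new ItemsSketch[String](64)
Seq("a", "c", "c", "c").foreach(x => right.update(x))

// merge() combines partial results, mirroring ApproxTopK.merge / ApproxTopKAccumulate.merge.
val merged = left.merge(right)

// getFrequentItems backs genEvalResult; each row carries an item and its estimated count.
merged.getFrequentItems(ErrorType.NO_FALSE_POSITIVES).take(2).foreach { row =>
  println(s"${row.getItem} -> ${row.getEstimate}")  // a -> 3 and c -> 3, in either order
}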
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/arithmetic.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/arithmetic.scala
index f9e8b6a17896f..c98e988ad3079 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/arithmetic.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/arithmetic.scala
@@ -55,6 +55,8 @@ case class UnaryMinus(
override def dataType: DataType = child.dataType
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def toString: String = s"-$child"
private lazy val numeric = TypeUtils.getNumeric(dataType, failOnError)
@@ -123,6 +125,8 @@ case class UnaryPositive(child: Expression)
override def dataType: DataType = child.dataType
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def sql: String = s"(+ ${child.sql})"
override lazy val replacement: Expression = child
@@ -155,6 +159,8 @@ case class Abs(child: Expression, failOnError: Boolean = SQLConf.get.ansiEnabled
override def dataType: DataType = child.dataType
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
private lazy val numeric = (dataType match {
case _: DayTimeIntervalType => LongExactNumeric
case _: YearMonthIntervalType => IntegerExactNumeric
@@ -187,6 +193,9 @@ case class Abs(child: Expression, failOnError: Boolean = SQLConf.get.ansiEnabled
abstract class BinaryArithmetic extends BinaryOperator with SupportQueryContext {
override def nullIntolerant: Boolean = true
+ override def contextIndependentFoldable: Boolean =
+ left.contextIndependentFoldable && right.contextIndependentFoldable
+
protected val evalMode: EvalMode.Value
private lazy val internalDataType: DataType = (left.dataType, right.dataType) match {
@@ -1193,6 +1202,7 @@ case class Least(children: Seq[Expression]) extends ComplexTypeMergingExpression
override def nullable: Boolean = children.forall(_.nullable)
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
private lazy val ordering = TypeUtils.getInterpretedOrdering(dataType)
@@ -1281,6 +1291,7 @@ case class Greatest(children: Seq[Expression]) extends ComplexTypeMergingExpress
override def nullable: Boolean = children.forall(_.nullable)
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
private lazy val ordering = TypeUtils.getInterpretedOrdering(dataType)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeFormatter.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeFormatter.scala
index 2ec31458270f3..4fb180a720129 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeFormatter.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeFormatter.scala
@@ -144,7 +144,7 @@ private class CodeFormatter {
// Lines starting with '}' should be de-indented even if they contain '{' after;
// in addition, lines ending with ':' are typically labels
val thisLineIndent = if (line.startsWith("}") || line.startsWith(")") || line.endsWith(":")) {
- " " * (indentSize * (indentLevel - 1))
+ " ".repeat(indentSize * (indentLevel - 1))
} else {
indentString
}
@@ -157,7 +157,7 @@ private class CodeFormatter {
}
code.append("\n")
indentLevel = newIndentLevel
- indentString = " " * (indentSize * newIndentLevel)
+ indentString = " ".repeat(indentSize * newIndentLevel)
currentLine += 1
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeGenerator.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeGenerator.scala
index 2564d4eab9bd6..8c702815e9b9f 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeGenerator.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/codegen/CodeGenerator.scala
@@ -33,7 +33,7 @@ import org.codehaus.janino.util.ClassFile.CodeAttribute
import org.apache.spark.{SparkException, SparkIllegalArgumentException, TaskContext, TaskKilledException}
import org.apache.spark.executor.InputMetrics
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.LogKeys._
import org.apache.spark.metrics.source.CodegenMetrics
import org.apache.spark.sql.catalyst.InternalRow
@@ -1989,7 +1989,7 @@ object CodeGenerator extends Logging {
case ByteType => java.lang.Byte.TYPE
case ShortType => java.lang.Short.TYPE
case IntegerType | DateType | _: YearMonthIntervalType => java.lang.Integer.TYPE
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType =>
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
java.lang.Long.TYPE
case FloatType => java.lang.Float.TYPE
case DoubleType => java.lang.Double.TYPE
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/collectionOperations.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/collectionOperations.scala
index b4978fbe1f70a..59196a959f758 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/collectionOperations.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/collectionOperations.scala
@@ -116,6 +116,7 @@ case class Size(child: Expression, legacySizeOfNull: Boolean)
def this(child: Expression) = this(child, SQLConf.get.legacySizeOfNull)
override def dataType: DataType = IntegerType
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
override def inputTypes: Seq[AbstractDataType] = Seq(TypeCollection(ArrayType, MapType))
override def nullable: Boolean = if (legacySizeOfNull) false else super.nullable
@@ -1003,7 +1004,7 @@ case class MapSort(base: Expression)
| ${CodeGenerator.getValue(values, valueType, i)});
|}
|
- |java.util.Arrays.sort($sortArray, new java.util.Comparator() {
+ |java.util.Arrays.parallelSort($sortArray, new java.util.Comparator() {
| @Override public int compare(Object $o1entry, Object $o2entry) {
| Object $o1 = (($simpleEntryType) $o1entry).getKey();
| Object $o2 = (($simpleEntryType) $o2entry).getKey();
@@ -1148,7 +1149,7 @@ case class SortArray(base: Expression, ascendingOrder: Expression)
private def sortEval(array: Any, ascending: Boolean): Any = {
val data = array.asInstanceOf[ArrayData].toArray[AnyRef](elementType)
if (elementType != NullType) {
- java.util.Arrays.sort(data, if (ascending) lt else gt)
+ java.util.Arrays.parallelSort(data, if (ascending) lt else gt)
}
new GenericArrayData(data.asInstanceOf[Array[Any]])
}
@@ -1190,7 +1191,7 @@ case class SortArray(base: Expression, ascendingOrder: Expression)
s"""
|if ($order) {
| $javaType[] $array = $base.to${primitiveTypeName}Array();
- | java.util.Arrays.sort($array);
+ | java.util.Arrays.parallelSort($array);
| ${ev.value} = $unsafeArrayData.fromPrimitiveArray($array);
|} else
""".stripMargin
@@ -1202,7 +1203,7 @@ case class SortArray(base: Expression, ascendingOrder: Expression)
|{
| Object[] $array = $base.toObjectArray($elementTypeTerm);
| final int $sortOrder = $order ? 1 : -1;
- | java.util.Arrays.sort($array, new java.util.Comparator() {
+ | java.util.Arrays.parallelSort($array, new java.util.Comparator() {
| @Override public int compare(Object $o1, Object $o2) {
| if ($o1 == null && $o2 == null) {
| return 0;
@@ -2158,6 +2159,8 @@ case class ArrayJoin(
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def eval(input: InternalRow): Any = {
val arrayEval = array.eval(input)
if (arrayEval == null) return null
@@ -2897,6 +2900,8 @@ case class Concat(children: Seq[Expression]) extends ComplexTypeMergingExpressio
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def eval(input: InternalRow): Any = doConcat(input)
@transient private lazy val doConcat: InternalRow => Any = dataType match {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeCreator.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeCreator.scala
index 81484f8dd7da5..f4232cae1066d 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeCreator.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeCreator.scala
@@ -71,6 +71,8 @@ case class CreateArray(children: Seq[Expression], useStringTypeWhenEmpty: Boolea
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def stringArgs: Iterator[Any] = super.stringArgs.take(1)
override def checkInputDataTypes(): TypeCheckResult = {
@@ -204,6 +206,8 @@ case class CreateMap(children: Seq[Expression], useStringTypeWhenEmpty: Boolean)
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def stringArgs: Iterator[Any] = super.stringArgs.take(1)
override def checkInputDataTypes(): TypeCheckResult = {
@@ -450,6 +454,8 @@ case class CreateNamedStruct(children: Seq[Expression]) extends Expression with
override def foldable: Boolean = valExprs.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
final override val nodePatterns: Seq[TreePattern] = Seq(CREATE_NAMED_STRUCT)
override lazy val dataType: StructType = {
@@ -591,18 +597,21 @@ case class StringToMap(text: Expression, pairDelim: Expression, keyValueDelim: E
private final lazy val collationId: Int = text.dataType.asInstanceOf[StringType].collationId
+ private lazy val legacySplitTruncate =
+ SQLConf.get.getConf(SQLConf.LEGACY_TRUNCATE_FOR_EMPTY_REGEX_SPLIT)
+
override def nullSafeEval(
inputString: Any,
stringDelimiter: Any,
keyValueDelimiter: Any): Any = {
val keyValues = CollationAwareUTF8String.splitSQL(inputString.asInstanceOf[UTF8String],
- stringDelimiter.asInstanceOf[UTF8String], -1, collationId)
+ stringDelimiter.asInstanceOf[UTF8String], -1, collationId, legacySplitTruncate)
val keyValueDelimiterUTF8String = keyValueDelimiter.asInstanceOf[UTF8String]
var i = 0
while (i < keyValues.length) {
val keyValueArray = CollationAwareUTF8String.splitSQL(
- keyValues(i), keyValueDelimiterUTF8String, 2, collationId)
+ keyValues(i), keyValueDelimiterUTF8String, 2, collationId, legacySplitTruncate)
val key = keyValueArray(0)
val value = if (keyValueArray.length < 2) null else keyValueArray(1)
mapBuilder.put(key, value)
@@ -617,9 +626,11 @@ case class StringToMap(text: Expression, pairDelim: Expression, keyValueDelim: E
nullSafeCodeGen(ctx, ev, (text, pd, kvd) =>
s"""
- |UTF8String[] $keyValues = CollationAwareUTF8String.splitSQL($text, $pd, -1, $collationId);
+ |UTF8String[] $keyValues =
+ | CollationAwareUTF8String.splitSQL($text, $pd, -1, $collationId, $legacySplitTruncate);
|for(UTF8String kvEntry: $keyValues) {
- | UTF8String[] kv = CollationAwareUTF8String.splitSQL(kvEntry, $kvd, 2, $collationId);
+ | UTF8String[] kv = CollationAwareUTF8String.splitSQL(
+ | kvEntry, $kvd, 2, $collationId, $legacySplitTruncate);
| $builderTerm.put(kv[0], kv.length == 2 ? kv[1] : null);
|}
|${ev.value} = $builderTerm.build();
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeExtractors.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeExtractors.scala
index 804c80bd68b49..5cdbdf3f0e7c7 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeExtractors.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/complexTypeExtractors.scala
@@ -35,6 +35,27 @@ import org.apache.spark.sql.types._
object ExtractValue {
+ /**
+ * Returns the resolved `ExtractValue` using the `extractValue` method call. In case the method
+ * returns `None`, it throws `QueryCompilationErrors.dataTypeUnsupportedByExtractValueError`.
+ *
+ * See `extractValue` doc for more info.
+ */
+ def apply(
+ child: Expression,
+ extraction: Expression,
+ resolver: Resolver): Expression = {
+ extractValue(child, extraction, resolver) match {
+ case Some(expression) => expression
+ case None =>
+ throw QueryCompilationErrors.dataTypeUnsupportedByExtractValueError(
+ child.dataType,
+ extraction,
+ child
+ )
+ }
+ }
+
/**
* Returns the resolved `ExtractValue`. It will return one kind of concrete `ExtractValue`,
* depend on the type of `child` and `extraction`.
@@ -46,33 +67,52 @@ object ExtractValue {
* Array | Integral type | GetArrayItem
* Map | map key type | GetMapValue
*/
- def apply(
+ def extractValue(
child: Expression,
extraction: Expression,
- resolver: Resolver): Expression = {
-
+ resolver: Resolver): Option[Expression] = {
(child.dataType, extraction) match {
case (StructType(fields), NonNullLiteral(v, _: StringType)) =>
val fieldName = v.toString
val ordinal = findField(fields, fieldName, resolver)
- GetStructField(child, ordinal, Some(fieldName))
+ Some(GetStructField(child, ordinal, Some(fieldName)))
case (ArrayType(StructType(fields), containsNull), NonNullLiteral(v, _: StringType)) =>
val fieldName = v.toString
val ordinal = findField(fields, fieldName, resolver)
- GetArrayStructFields(child, fields(ordinal).copy(name = fieldName),
- ordinal, fields.length, containsNull || fields(ordinal).nullable)
+ Some(
+ GetArrayStructFields(
+ child,
+ fields(ordinal).copy(name = fieldName),
+ ordinal,
+ fields.length,
+ containsNull || fields(ordinal).nullable
+ )
+ )
- case (_: ArrayType, _) => GetArrayItem(child, extraction)
+ case (_: ArrayType, _) => Some(GetArrayItem(child, extraction))
- case (MapType(_, _, _), _) => GetMapValue(child, extraction)
+ case (MapType(_, _, _), _) => Some(GetMapValue(child, extraction))
- case (otherType, _) =>
- throw QueryCompilationErrors.dataTypeUnsupportedByExtractValueError(
- otherType, extraction, child)
+ case _ => None
}
}
+ /**
+ * Check that `attribute` can be fully extracted using the given `nestedFields`.
+ */
+ def isExtractable(
+ attribute: Attribute, nestedFields: Seq[String], resolver: Resolver): Boolean = {
+ nestedFields
+ .foldLeft(Some(attribute): Option[Expression]) {
+ case (Some(expression), field) =>
+ ExtractValue.extractValue(expression, Literal(field), resolver)
+ case _ =>
+ None
+ }
+ .isDefined
+ }
+
/**
* Find the ordinal of StructField, report error if no desired field or over one
* desired fields are found.
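To show how the new isExtractable helper behaves, the following standalone snippet (the attribute name and schema are made up for illustration) walks a chain of nested field names and also exercises the None path for a type that supports no extraction:

import org.apache.spark.sql.catalyst.analysis.caseInsensitiveResolution
import org.apache.spark.sql.catalyst.expressions.{AttributeReference, ExtractValue}
import org.apache.spark.sql.types._

// a: struct<b: struct<c: int>>
val nested = AttributeReference("a",
  StructType(Seq(StructField("b", StructType(Seq(StructField("c", IntegerType)))))))()

// Every step resolves to a GetStructField, so the whole chain is extractable.
ExtractValue.isExtractable(nested, Seq("b", "c"), caseInsensitiveResolution)  // true

// An integer column offers nothing to extract: extractValue returns None, so this is false.
val scalar = AttributeReference("x", IntegerType)()
ExtractValue.isExtractable(scalar, Seq("b"), caseInsensitiveResolution)       // false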
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/conditionalExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/conditionalExpressions.scala
index 609d457fbd067..621f02ca18b86 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/conditionalExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/conditionalExpressions.scala
@@ -200,6 +200,8 @@ case class CaseWhen(
branches.exists(_._2.nullable) || elseValue.map(_.nullable).getOrElse(true)
}
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def checkInputDataTypes(): TypeCheckResult = {
if (TypeCoercion.haveSameType(inputTypesForMerging)) {
// Make sure all branch conditions are boolean types.
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/datetimeExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/datetimeExpressions.scala
index 4ae8883dae043..375b58d8bb7e2 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/datetimeExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/datetimeExpressions.scala
@@ -29,6 +29,7 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.{ExpressionBuilder, FunctionRegistry}
import org.apache.spark.sql.catalyst.expressions.codegen._
import org.apache.spark.sql.catalyst.expressions.codegen.Block._
+import org.apache.spark.sql.catalyst.expressions.objects.StaticInvoke
import org.apache.spark.sql.catalyst.trees.CurrentOrigin.withOrigin
import org.apache.spark.sql.catalyst.trees.TreePattern._
import org.apache.spark.sql.catalyst.util.{DateTimeUtils, LegacyDateFormats, TimestampFormatter}
@@ -323,6 +324,7 @@ case class DateAdd(startDate: Expression, days: Expression)
override def nullIntolerant: Boolean = true
override def left: Expression = startDate
override def right: Expression = days
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def inputTypes: Seq[AbstractDataType] =
Seq(DateType, TypeCollection(IntegerType, ShortType, ByteType))
@@ -362,6 +364,7 @@ case class DateSub(startDate: Expression, days: Expression)
override def nullIntolerant: Boolean = true
override def left: Expression = startDate
override def right: Expression = days
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def inputTypes: Seq[AbstractDataType] =
Seq(DateType, TypeCollection(IntegerType, ShortType, ByteType))
@@ -1646,7 +1649,10 @@ case class NextDay(
/**
* Adds an interval to timestamp.
*/
-case class TimeAdd(start: Expression, interval: Expression, timeZoneId: Option[String] = None)
+case class TimestampAddInterval(
+ start: Expression,
+ interval: Expression,
+ timeZoneId: Option[String] = None)
extends BinaryExpression with TimeZoneAwareExpression with ExpectsInputTypes {
override def nullIntolerant: Boolean = true
@@ -1689,7 +1695,7 @@ case class TimeAdd(start: Expression, interval: Expression, timeZoneId: Option[S
}
override protected def withNewChildrenInternal(
- newLeft: Expression, newRight: Expression): TimeAdd =
+ newLeft: Expression, newRight: Expression): TimestampAddInterval =
copy(start = newLeft, interval = newRight)
}
@@ -2119,7 +2125,7 @@ case class ParseToDate(
this(left, None)
}
- override def prettyName: String = "to_date"
+ override def nodeName: String = "to_date"
override def withTimeZone(timeZoneId: String): TimeZoneAwareExpression =
copy(timeZoneId = Some(timeZoneId))
@@ -2149,6 +2155,45 @@ case class ParseToDate(
}
}
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(date_str[, fmt]) - Parses the `date_str` expression with the `fmt` expression to a date.
+ The function always returns null on an invalid input with/without ANSI SQL mode enabled. By
+ default, it follows casting rules to a date if the `fmt` is omitted.
+ """,
+ arguments = """
+ Arguments:
+ * date_str - A string to be parsed to date.
+ * fmt - Date format pattern to follow. See Datetime Patterns for valid
+ date and time format patterns.
+ """,
+ examples = """
+ Examples:
+ > SELECT _FUNC_('2016-12-31');
+ 2016-12-31
+ > SELECT _FUNC_('2016-12-31', 'yyyy-MM-dd');
+ 2016-12-31
+ > SELECT _FUNC_('foo', 'yyyy-MM-dd');
+ NULL
+ """,
+ group = "datetime_funcs",
+ since = "4.0.0")
+// scalastyle:on line.size.limit
+object TryToDateExpressionBuilder extends ExpressionBuilder {
+ override def build(funcName: String, expressions: Seq[Expression]): Expression = {
+ val numArgs = expressions.length
+ if (numArgs == 1 || numArgs == 2) {
+ ParseToDate(
+ expressions.head,
+ expressions.drop(1).lastOption,
+ ansiEnabled = false)
+ } else {
+ throw QueryCompilationErrors.wrongNumArgsError(funcName, Seq(1, 2), numArgs)
+ }
+ }
+}
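A minimal usage sketch of this builder, assuming a running SparkSession named `spark` and that it is registered under the SQL name try_to_date (the registry change is not shown in this hunk); the expected outputs restate the examples above:

spark.sql("SELECT try_to_date('2016-12-31', 'yyyy-MM-dd')").show()  // 2016-12-31
spark.sql("SELECT try_to_date('foo', 'yyyy-MM-dd')").show()         // NULL, never an error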
+
/**
* Parses a column to a timestamp based on the supplied format.
*/
@@ -2554,9 +2599,36 @@ case class MakeDate(
copy(year = newFirst, month = newSecond, day = newThird)
}
+case class MakeTimestampNTZ(left: Expression, right: Expression)
+ extends BinaryExpression
+ with RuntimeReplaceable
+ with ExpectsInputTypes {
+
+ override def replacement: Expression = StaticInvoke(
+ classOf[DateTimeUtils.type],
+ TimestampNTZType,
+ "makeTimestampNTZ",
+ Seq(left, right),
+ Seq(left.dataType, right.dataType)
+ )
+
+ override def inputTypes: Seq[AbstractDataType] = Seq(DateType, AnyTimeType)
+
+ override def prettyName: String = "make_timestamp_ntz"
+
+ override protected def withNewChildrenInternal(
+ newLeft: Expression, newRight: Expression): Expression = {
+ copy(left = newLeft, right = newRight)
+ }
+}
+
// scalastyle:off line.size.limit
@ExpressionDescription(
- usage = "_FUNC_(year, month, day, hour, min, sec) - Create local date-time from year, month, day, hour, min, sec fields. If the configuration `spark.sql.ansi.enabled` is false, the function returns NULL on invalid inputs. Otherwise, it will throw an error instead.",
+ usage = """
+ _FUNC_(year, month, day, hour, min, sec) - Create local date-time from year, month, day, hour, min, sec fields. If the configuration `spark.sql.ansi.enabled` is false, the function returns NULL on invalid inputs. Otherwise, it will throw an error instead.
+
+ _FUNC_(date, time) - Create a local date-time from date and time fields.
+ """,
arguments = """
Arguments:
* year - the year to represent, from 1 to 9999
@@ -2567,6 +2639,8 @@ case class MakeDate(
* sec - the second-of-minute and its micro-fraction to represent, from
0 to 60. If the sec argument equals to 60, the seconds field is set
to 0 and 1 minute is added to the final timestamp.
+ * date - a date to represent, from 0001-01-01 to 9999-12-31
+ * time - a local time to represent, from 00:00:00 to 23:59:59.999999
""",
examples = """
Examples:
@@ -2576,6 +2650,8 @@ case class MakeDate(
2019-07-01 00:00:00
> SELECT _FUNC_(null, 7, 22, 15, 30, 0);
NULL
+ > SELECT _FUNC_(DATE'2014-12-28', TIME'6:30:45.887');
+ 2014-12-28 06:30:45.887
""",
group = "datetime_funcs",
since = "3.4.0")
@@ -2583,7 +2659,9 @@ case class MakeDate(
object MakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
override def build(funcName: String, expressions: Seq[Expression]): Expression = {
val numArgs = expressions.length
- if (numArgs == 6) {
+ if (numArgs == 2) {
+ MakeTimestampNTZ(expressions(0), expressions(1))
+ } else if (numArgs == 6) {
MakeTimestamp(
expressions(0),
expressions(1),
@@ -2593,14 +2671,18 @@ object MakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
expressions(5),
dataType = TimestampNTZType)
} else {
- throw QueryCompilationErrors.wrongNumArgsError(funcName, Seq(6), numArgs)
+ throw QueryCompilationErrors.wrongNumArgsError(funcName, Seq(2, 6), numArgs)
}
}
}
// scalastyle:off line.size.limit
@ExpressionDescription(
- usage = "_FUNC_(year, month, day, hour, min, sec) - Try to create local date-time from year, month, day, hour, min, sec fields. The function returns NULL on invalid inputs.",
+ usage = """
+ _FUNC_(year, month, day, hour, min, sec) - Try to create local date-time from year, month, day, hour, min, sec fields. The function returns NULL on invalid inputs.
+
+ _FUNC_(date, time) - Create a local date-time from date and time fields.
+ """,
arguments = """
Arguments:
* year - the year to represent, from 1 to 9999
@@ -2611,6 +2693,8 @@ object MakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
* sec - the second-of-minute and its micro-fraction to represent, from
0 to 60. If the sec argument equals to 60, the seconds field is set
to 0 and 1 minute is added to the final timestamp.
+ * date - a date to represent, from 0001-01-01 to 9999-12-31
+ * time - a local time to represent, from 00:00:00 to 23:59:59.999999
""",
examples = """
Examples:
@@ -2622,6 +2706,8 @@ object MakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
NULL
> SELECT _FUNC_(2024, 13, 22, 15, 30, 0);
NULL
+ > SELECT _FUNC_(DATE'2014-12-28', TIME'6:30:45.887');
+ 2014-12-28 06:30:45.887
""",
group = "datetime_funcs",
since = "4.0.0")
@@ -2629,7 +2715,9 @@ object MakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
object TryMakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
override def build(funcName: String, expressions: Seq[Expression]): Expression = {
val numArgs = expressions.length
- if (numArgs == 6) {
+ if (numArgs == 2) {
+ TryEval(MakeTimestampNTZ(expressions(0), expressions(1)))
+ } else if (numArgs == 6) {
MakeTimestamp(
expressions(0),
expressions(1),
@@ -2647,7 +2735,11 @@ object TryMakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
// scalastyle:off line.size.limit
@ExpressionDescription(
- usage = "_FUNC_(year, month, day, hour, min, sec[, timezone]) - Create the current timestamp with local time zone from year, month, day, hour, min, sec and timezone fields. If the configuration `spark.sql.ansi.enabled` is false, the function returns NULL on invalid inputs. Otherwise, it will throw an error instead.",
+ usage = """
+ _FUNC_(year, month, day, hour, min, sec[, timezone]) - Create the current timestamp with local time zone from year, month, day, hour, min, sec and (optional) timezone fields. If the configuration `spark.sql.ansi.enabled` is false, the function returns NULL on invalid inputs. Otherwise, it will throw an error instead.
+
+ _FUNC_(date, time[, timezone]) - Create a timestamp with local time zone from date, time and (optional) timezone fields.
+ """,
arguments = """
Arguments:
* year - the year to represent, from 1 to 9999
@@ -2659,6 +2751,8 @@ object TryMakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
0 to 60. If the sec argument equals to 60, the seconds field is set
to 0 and 1 minute is added to the final timestamp.
+ * timezone - the time zone identifier. For example, CET, UTC, etc.
+ * date - a date to represent, from 0001-01-01 to 9999-12-31
+ * time - a local time to represent, from 00:00:00 to 23:59:59.999999
""",
examples = """
Examples:
@@ -2670,6 +2764,10 @@ object TryMakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
2019-07-01 00:00:00
> SELECT _FUNC_(null, 7, 22, 15, 30, 0);
NULL
+ > SELECT _FUNC_(DATE'2014-12-28', TIME'6:30:45.887');
+ 2014-12-28 06:30:45.887
+ > SELECT _FUNC_(DATE'2014-12-28', TIME'6:30:45.887', 'CET');
+ 2014-12-27 21:30:45.887
""",
group = "datetime_funcs",
since = "3.4.0")
@@ -2677,7 +2775,16 @@ object TryMakeTimestampNTZExpressionBuilder extends ExpressionBuilder {
object MakeTimestampLTZExpressionBuilder extends ExpressionBuilder {
override def build(funcName: String, expressions: Seq[Expression]): Expression = {
val numArgs = expressions.length
- if (numArgs == 6 || numArgs == 7) {
+ if (numArgs == 2 || numArgs == 3) {
+ // Overload for: date, time[, timezone].
+ MakeTimestampFromDateTime(
+ expressions(0),
+ Some(expressions(1)),
+ expressions.drop(2).lastOption
+ )
+ } else if (numArgs == 6 || numArgs == 7) {
+ // Overload for: year, month, day, hour, min, sec[, timezone].
MakeTimestamp(
expressions(0),
expressions(1),
@@ -2688,7 +2795,7 @@ object MakeTimestampLTZExpressionBuilder extends ExpressionBuilder {
expressions.drop(6).lastOption,
dataType = TimestampType)
} else {
- throw QueryCompilationErrors.wrongNumArgsError(funcName, Seq(6), numArgs)
+ throw QueryCompilationErrors.wrongNumArgsError(funcName, Seq(2, 6), numArgs)
}
}
}
@@ -2744,38 +2851,6 @@ object TryMakeTimestampLTZExpressionBuilder extends ExpressionBuilder {
}
}
-// scalastyle:off line.size.limit
-@ExpressionDescription(
- usage = "_FUNC_(year, month, day, hour, min, sec[, timezone]) - Create timestamp from year, month, day, hour, min, sec and timezone fields. The result data type is consistent with the value of configuration `spark.sql.timestampType`. If the configuration `spark.sql.ansi.enabled` is false, the function returns NULL on invalid inputs. Otherwise, it will throw an error instead.",
- arguments = """
- Arguments:
- * year - the year to represent, from 1 to 9999
- * month - the month-of-year to represent, from 1 (January) to 12 (December)
- * day - the day-of-month to represent, from 1 to 31
- * hour - the hour-of-day to represent, from 0 to 23
- * min - the minute-of-hour to represent, from 0 to 59
- * sec - the second-of-minute and its micro-fraction to represent, from 0 to 60.
- The value can be either an integer like 13 , or a fraction like 13.123.
- If the sec argument equals to 60, the seconds field is set
- to 0 and 1 minute is added to the final timestamp.
- * timezone - the time zone identifier. For example, CET, UTC and etc.
- """,
- examples = """
- Examples:
- > SELECT _FUNC_(2014, 12, 28, 6, 30, 45.887);
- 2014-12-28 06:30:45.887
- > SELECT _FUNC_(2014, 12, 28, 6, 30, 45.887, 'CET');
- 2014-12-27 21:30:45.887
- > SELECT _FUNC_(2019, 6, 30, 23, 59, 60);
- 2019-07-01 00:00:00
- > SELECT _FUNC_(2019, 6, 30, 23, 59, 1);
- 2019-06-30 23:59:01
- > SELECT _FUNC_(null, 7, 22, 15, 30, 0);
- NULL
- """,
- group = "datetime_funcs",
- since = "3.0.0")
-// scalastyle:on line.size.limit
case class MakeTimestamp(
year: Expression,
month: Expression,
@@ -3030,6 +3105,147 @@ case class TryMakeTimestamp(
}
}
+case class MakeTimestampFromDateTime(
+ date: Expression,
+ time: Option[Expression] = None,
+ timezone: Option[Expression] = None,
+ timeZoneId: Option[String] = None)
+ extends Expression with RuntimeReplaceable with ExpectsInputTypes with TimeZoneAwareExpression {
+
+ def this(date: Expression) =
+ this(date, None, None, None)
+
+ def this(date: Expression, time: Expression) =
+ this(date, Some(time), None, None)
+
+ def this(date: Expression, time: Expression, timezone: Expression) =
+ this(date, Some(time), Some(timezone), None)
+
+ override def children: Seq[Expression] = Seq(date) ++ time ++ timezone
+
+ override def inputTypes: Seq[AbstractDataType] = Seq(DateType, AnyTimeType) ++
+ timezone.map(_ => StringTypeWithCollation(supportsTrimCollation = true))
+
+ override def replacement: Expression = {
+ // If time is not provided, we use midnight, i.e. 00:00:00.
+ val timeExpr = time.getOrElse(Literal(0L, TimeType(0)))
+ // If timezone is not provided, we use the session timezone.
+ val zoneIdExpr = timezone.getOrElse(Literal(timeZoneId.get))
+ StaticInvoke(
+ classOf[DateTimeUtils.type],
+ TimestampType,
+ "makeTimestamp",
+ Seq(date, timeExpr, zoneIdExpr),
+ Seq(date.dataType, timeExpr.dataType, zoneIdExpr.dataType),
+ returnNullable = children.exists(_.nullable)
+ )
+ }
+
+ override def prettyName: String = "make_timestamp"
+
+ override def withTimeZone(timeZoneId: String): TimeZoneAwareExpression =
+ copy(timeZoneId = Option(timeZoneId))
+
+ override def nodePatternsInternal(): Seq[TreePattern] = Seq(RUNTIME_REPLACEABLE)
+
+ override protected def withNewChildrenInternal(
+ newChildren: IndexedSeq[Expression]): Expression = {
+ val timeOpt = if (time.isDefined) Some(newChildren(1)) else None
+ val timezoneOpt = if (timezone.isDefined) Some(newChildren(2)) else None
+ copy(date = newChildren(0), time = timeOpt, timezone = timezoneOpt)
+ }
+}
+
+/**
+ * This make_timestamp expression builder creates a timestamp from:
+ * - a year, month, day, hour, min, sec and optional timezone, or
+ * - a date, optional time, and optional timezone.
+ */
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(year, month, day, hour, min, sec[, timezone]) - Create the current timestamp with local time zone from year, month, day, hour, min, sec and timezone fields. If the configuration `spark.sql.ansi.enabled` is false, the function returns NULL on invalid inputs. Otherwise, it will throw an error instead.
+
+ _FUNC_(date[, time[, timezone]]) - Create timestamp from a date and optional time and timezone fields.
+ """,
+ arguments = """
+ Arguments:
+ * year - the year to represent, from 1 to 9999
+ * month - the month-of-year to represent, from 1 (January) to 12 (December)
+ * day - the day-of-month to represent, from 1 to 31
+ * hour - the hour-of-day to represent, from 0 to 23
+ * min - the minute-of-hour to represent, from 0 to 59
+ * sec - the second-of-minute and its micro-fraction to represent, from
+ 0 to 60. If the sec argument equals to 60, the seconds field is set
+ to 0 and 1 minute is added to the final timestamp.
+ * date - a date expression
+ * time - a time expression (optional). Default is 00:00:00.
+ * timezone - the time zone identifier (optional). For example, CET, UTC, etc.
+ """,
+ examples = """
+ Examples:
+ > SELECT _FUNC_(2014, 12, 28, 6, 30, 45.887);
+ 2014-12-28 06:30:45.887
+ > SELECT _FUNC_(2014, 12, 28, 6, 30, 45.887, 'CET');
+ 2014-12-27 21:30:45.887
+ > SELECT _FUNC_(DATE'2014-12-28');
+ 2014-12-28 00:00:00
+ > SELECT _FUNC_(DATE'2014-12-28', TIME'6:30:45.887');
+ 2014-12-28 06:30:45.887
+ > SELECT _FUNC_(DATE'2014-12-28', TIME'6:30:45.887', 'CET');
+ 2014-12-27 21:30:45.887
+ """,
+ group = "datetime_funcs",
+ since = "3.0.0")
+// scalastyle:on line.size.limit
+object MakeTimestampExpressionBuilder extends ExpressionBuilder {
+ override def build(funcName: String, expressions: Seq[Expression]): Expression = {
+ val numArgs = expressions.length
+ if (numArgs == 1) {
+ // date
+ MakeTimestampFromDateTime(
+ expressions(0)
+ )
+ } else if (numArgs == 2) {
+ // date, time
+ MakeTimestampFromDateTime(
+ expressions(0),
+ Some(expressions(1))
+ )
+ } else if (numArgs == 3) {
+ // date, time, timezone
+ MakeTimestampFromDateTime(
+ expressions(0),
+ Some(expressions(1)),
+ Some(expressions(2))
+ )
+ } else if (numArgs == 6) {
+ // year, month, day, hour, min, sec
+ MakeTimestamp(
+ expressions(0),
+ expressions(1),
+ expressions(2),
+ expressions(3),
+ expressions(4),
+ expressions(5)
+ )
+ } else if (numArgs == 7) {
+ // year, month, day, hour, min, sec, timezone
+ MakeTimestamp(
+ expressions(0),
+ expressions(1),
+ expressions(2),
+ expressions(3),
+ expressions(4),
+ expressions(5),
+ Some(expressions(6))
+ )
+ } else {
+ throw QueryCompilationErrors.wrongNumArgsError(funcName, Seq(1, 2, 3, 6, 7), numArgs)
+ }
+ }
+}
+
object DatePart {
def parseExtractField(
@@ -3294,6 +3510,8 @@ case class SubtractDates(
if (legacyInterval) CalendarIntervalType else DayTimeIntervalType(DAY)
}
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
@transient
private lazy val evalFunc: (Int, Int) => Any = if (legacyInterval) {
(leftDays: Int, rightDays: Int) => subtractDates(leftDays, rightDays)
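As an end-to-end illustration of the new date/time overloads added in this file, here is a usage sketch only, assuming a running SparkSession named `spark`; the expected values restate the documented examples:

// 2-arg overload: date + time, resolved by MakeTimestampExpressionBuilder.
spark.sql("SELECT make_timestamp(DATE'2014-12-28', TIME'6:30:45.887')").show()
// 2014-12-28 06:30:45.887

// 3-arg overload: date + time + timezone, lowered to MakeTimestampFromDateTime.
spark.sql("SELECT make_timestamp_ltz(DATE'2014-12-28', TIME'6:30:45.887', 'CET')").show()
// 2014-12-27 21:30:45.887

// NTZ variant: date + time, lowered to MakeTimestampNTZ / DateTimeUtils.makeTimestampNTZ.
spark.sql("SELECT make_timestamp_ntz(DATE'2014-12-28', TIME'6:30:45.887')").show()
// 2014-12-28 06:30:45.887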
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/hash.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/hash.scala
index 7cb645e601d36..88e22a91a64a7 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/hash.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/hash.scala
@@ -38,6 +38,7 @@ import org.apache.spark.sql.catalyst.util.DateTimeConstants._
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types._
+import org.apache.spark.sql.util.SchemaUtils
import org.apache.spark.unsafe.Platform
import org.apache.spark.unsafe.hash.Murmur3_x86_32
import org.apache.spark.unsafe.types.{CalendarInterval, UTF8String}
@@ -68,6 +69,8 @@ case class Md5(child: Expression)
override def inputTypes: Seq[DataType] = Seq(BinaryType)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
protected override def nullSafeEval(input: Any): Any =
UTF8String.fromString(DigestUtils.md5Hex(input.asInstanceOf[Array[Byte]]))
@@ -112,6 +115,8 @@ case class Sha2(left: Expression, right: Expression)
override def inputTypes: Seq[DataType] = Seq(BinaryType, IntegerType)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
protected override def nullSafeEval(input1: Any, input2: Any): Any = {
val bitLength = input2.asInstanceOf[Int]
val input = input1.asInstanceOf[Array[Byte]]
@@ -178,6 +183,8 @@ case class Sha1(child: Expression)
override def inputTypes: Seq[DataType] = Seq(BinaryType)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
protected override def nullSafeEval(input: Any): Any =
UTF8String.fromString(DigestUtils.sha1Hex(input.asInstanceOf[Array[Byte]]))
@@ -211,6 +218,8 @@ case class Crc32(child: Expression)
override def inputTypes: Seq[DataType] = Seq(BinaryType)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
protected override def nullSafeEval(input: Any): Any = {
val checksum = new CRC32
checksum.update(input.asInstanceOf[Array[Byte]], 0, input.asInstanceOf[Array[Byte]].length)
@@ -273,8 +282,15 @@ abstract class HashExpression[E] extends Expression {
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def nullable: Boolean = false
+ protected def isCollationAware: Boolean
+
+ protected lazy val legacyCollationAwareHashing: Boolean =
+ SQLConf.get.getConf(SQLConf.COLLATION_AWARE_HASHING_ENABLED)
+
private def hasMapType(dt: DataType): Boolean = {
dt.existsRecursively(_.isInstanceOf[MapType])
}
@@ -429,14 +445,43 @@ abstract class HashExpression[E] extends Expression {
val numBytes = s"$input.numBytes()"
s"$result = $hasherClassName.hashUnsafeBytes($baseObject, $baseOffset, $numBytes, $result);"
} else {
- val stringHash = ctx.freshName("stringHash")
- s"""
- long $stringHash = CollationFactory.fetchCollation(${stringType.collationId})
- .hashFunction.applyAsLong($input);
- $result = $hasherClassName.hashLong($stringHash, $result);
- """
+ if (isCollationAware) {
+ val key = ctx.freshName("key")
+ val offset = "Platform.BYTE_ARRAY_OFFSET"
+ s"""
+ byte[] $key = (byte[]) CollationFactory.fetchCollation(${stringType.collationId})
+ .sortKeyFunction.apply($input);
+ $result = $hasherClassName.hashUnsafeBytes($key, $offset, $key.length, $result);
+ """
+ } else if (legacyCollationAwareHashing) {
+ val collation = CollationFactory.fetchCollation(stringType.collationId)
+ val stringHash = ctx.freshName("stringHash")
+ if (collation.isUtf8BinaryType || collation.isUtf8LcaseType) {
+ s"""
+ long $stringHash = UTF8String.fromBytes((byte[]) CollationFactory
+ .fetchCollation(${stringType.collationId}).sortKeyFunction.apply($input)).hashCode();
+ $result = $hasherClassName.hashLong($stringHash, $result);
+ """
+ } else if (collation.supportsSpaceTrimming) {
+ s"""
+ long $stringHash = CollationFactory.fetchCollation(${stringType.collationId})
+ .getCollator().getCollationKey($input.trimRight().toValidString()).hashCode();
+ $result = $hasherClassName.hashLong($stringHash, $result);
+ """
+ } else {
+ s"""
+ long $stringHash = CollationFactory.fetchCollation(${stringType.collationId})
+ .getCollator().getCollationKey($input.toValidString()).hashCode();
+ $result = $hasherClassName.hashLong($stringHash, $result);
+ """
+ }
+ } else {
+ val baseObject = s"$input.getBaseObject()"
+ val baseOffset = s"$input.getBaseOffset()"
+ val numBytes = s"$input.numBytes()"
+ s"$result = $hasherClassName.hashUnsafeBytes($baseObject, $baseOffset, $numBytes, $result);"
+ }
}
-
}
protected def genHashForMap(
@@ -546,10 +591,38 @@ abstract class InterpretedHashFunction {
protected def hashUnsafeBytes(base: AnyRef, offset: Long, length: Int, seed: Long): Long
/**
- * Computes hash of a given `value` of type `dataType`. The caller needs to check the validity
- * of input `value`.
+ * This method is intended for callers using the old hash API and preserves compatibility for
+ * supported data types. It must only be used for data types that do not include collated strings
+ * or complex types (e.g., structs, arrays, maps) that may contain collated strings.
+ *
+ * The caller is responsible for ensuring that `dataType` does not involve collation-aware fields.
+ * This is validated via a runtime `require` check.
+ *
+ * @throws IllegalArgumentException if `dataType` contains a non-UTF8_BINARY collation.
*/
def hash(value: Any, dataType: DataType, seed: Long): Long = {
+ require(!SchemaUtils.hasNonUTF8BinaryCollation(dataType))
+ // For UTF8_BINARY, hashing behavior is the same regardless of the isCollationAware flag.
+ hash(
+ value = value,
+ dataType = dataType,
+ seed = seed,
+ isCollationAware = false,
+ legacyCollationAwareHashing = false)
+ }
+
+ /**
+ * Computes hash of a given `value` of type `dataType`. The caller needs to check the validity
+ * of input `value`. The `isCollationAware` boolean flag indicates whether hashing should take
+ * a string's collation into account. If not, the bytes of the string are hashed, otherwise the
+ * collation key of the string is hashed.
+ */
+ def hash(
+ value: Any,
+ dataType: DataType,
+ seed: Long,
+ isCollationAware: Boolean,
+ legacyCollationAwareHashing: Boolean): Long = {
value match {
case null => seed
case b: Boolean => hashInt(if (b) 1 else 0, seed)
@@ -575,12 +648,25 @@ abstract class InterpretedHashFunction {
case s: UTF8String =>
val st = dataType.asInstanceOf[StringType]
if (st.supportsBinaryEquality) {
- hashUnsafeBytes(s.getBaseObject, s.getBaseOffset, s.numBytes(), seed)
+ hashUnsafeBytes(s.getBaseObject, s.getBaseOffset, s.numBytes, seed)
} else {
- val stringHash = CollationFactory
- .fetchCollation(st.collationId)
- .hashFunction.applyAsLong(s)
- hashLong(stringHash, seed)
+ if (isCollationAware) {
+ val key = CollationFactory.fetchCollation(st.collationId).sortKeyFunction.apply(s)
+ .asInstanceOf[Array[Byte]]
+ hashUnsafeBytes(key, Platform.BYTE_ARRAY_OFFSET, key.length, seed)
+ } else if (legacyCollationAwareHashing) {
+ val collation = CollationFactory.fetchCollation(st.collationId)
+ val stringHash = if (collation.isUtf8BinaryType || collation.isUtf8LcaseType) {
+ UTF8String.fromBytes(collation.sortKeyFunction.apply(s)).hashCode
+ } else if (collation.supportsSpaceTrimming) {
+ collation.getCollator.getCollationKey(s.trimRight.toValidString).hashCode
+ } else {
+ collation.getCollator.getCollationKey(s.toValidString).hashCode
+ }
+ hashLong(stringHash, seed)
+ } else {
+ hashUnsafeBytes(s.getBaseObject, s.getBaseOffset, s.numBytes, seed)
+ }
}
case array: ArrayData =>
@@ -591,7 +677,12 @@ abstract class InterpretedHashFunction {
var result = seed
var i = 0
while (i < array.numElements()) {
- result = hash(array.get(i, elementType), elementType, result)
+ result = hash(
+ array.get(i, elementType),
+ elementType,
+ result,
+ isCollationAware,
+ legacyCollationAwareHashing)
i += 1
}
result
@@ -608,8 +699,18 @@ abstract class InterpretedHashFunction {
var result = seed
var i = 0
while (i < map.numElements()) {
- result = hash(keys.get(i, kt), kt, result)
- result = hash(values.get(i, vt), vt, result)
+ result = hash(
+ keys.get(i, kt),
+ kt,
+ result,
+ isCollationAware,
+ legacyCollationAwareHashing)
+ result = hash(
+ values.get(i, vt),
+ vt,
+ result,
+ isCollationAware,
+ legacyCollationAwareHashing)
i += 1
}
result
@@ -624,7 +725,12 @@ abstract class InterpretedHashFunction {
var i = 0
val len = struct.numFields
while (i < len) {
- result = hash(struct.get(i, types(i)), types(i), result)
+ result = hash(
+ struct.get(i, types(i)),
+ types(i),
+ result,
+ isCollationAware,
+ legacyCollationAwareHashing)
i += 1
}
result
@@ -656,8 +762,12 @@ case class Murmur3Hash(children: Seq[Expression], seed: Int) extends HashExpress
override protected def hasherClassName: String = classOf[Murmur3_x86_32].getName
+ override protected def isCollationAware: Boolean = false
+
override protected def computeHash(value: Any, dataType: DataType, seed: Int): Int = {
- Murmur3HashFunction.hash(value, dataType, seed).toInt
+ Murmur3HashFunction.hash(
+ value, dataType, seed, isCollationAware, legacyCollationAwareHashing
+ ).toInt
}
override protected def withNewChildrenInternal(newChildren: IndexedSeq[Expression]): Murmur3Hash =
@@ -678,6 +788,29 @@ object Murmur3HashFunction extends InterpretedHashFunction {
}
}
+case class CollationAwareMurmur3Hash(children: Seq[Expression], seed: Int)
+ extends HashExpression[Int] {
+ def this(arguments: Seq[Expression]) = this(arguments, 42)
+
+ override def dataType: DataType = IntegerType
+
+ override def prettyName: String = "collation_aware_hash"
+
+ override protected def hasherClassName: String = classOf[Murmur3_x86_32].getName
+
+ override protected def isCollationAware: Boolean = true
+
+ override protected def computeHash(value: Any, dataType: DataType, seed: Int): Int = {
+ Murmur3HashFunction.hash(
+ value, dataType, seed, isCollationAware, legacyCollationAwareHashing
+ ).toInt
+ }
+
+ override protected def withNewChildrenInternal(newChildren: IndexedSeq[Expression]):
+ CollationAwareMurmur3Hash = copy(children = newChildren)
+}
+
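// A minimal sketch (not part of the patch) of why sort-key hashing makes the collation-aware
// hash agree with collation equality. `CollationFactory.collationNameToId` is assumed here to
// resolve a collation name to its id.
import java.util.Arrays
import org.apache.spark.sql.catalyst.util.CollationFactory
import org.apache.spark.unsafe.types.UTF8String

val lcase = CollationFactory.fetchCollation(CollationFactory.collationNameToId("UTF8_LCASE"))
val k1 = lcase.sortKeyFunction.apply(UTF8String.fromString("abc")).asInstanceOf[Array[Byte]]
val k2 = lcase.sortKeyFunction.apply(UTF8String.fromString("ABC")).asInstanceOf[Array[Byte]]
// Equal sort keys imply equal hashes when isCollationAware = true, so "abc" and "ABC" hash to
// the same value under UTF8_LCASE, as collation equality requires.
assert(Arrays.equals(k1, k2))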
/**
* A xxHash64 64-bit hash expression.
*/
@@ -700,8 +833,10 @@ case class XxHash64(children: Seq[Expression], seed: Long) extends HashExpressio
override protected def hasherClassName: String = classOf[XXH64].getName
+ override protected def isCollationAware: Boolean = false
+
override protected def computeHash(value: Any, dataType: DataType, seed: Long): Long = {
- XxHash64Function.hash(value, dataType, seed)
+ XxHash64Function.hash(value, dataType, seed, isCollationAware, legacyCollationAwareHashing)
}
override protected def withNewChildrenInternal(newChildren: IndexedSeq[Expression]): XxHash64 =
@@ -718,6 +853,28 @@ object XxHash64Function extends InterpretedHashFunction {
}
}
+case class CollationAwareXxHash64(children: Seq[Expression], seed: Long)
+ extends HashExpression[Long] {
+ def this(arguments: Seq[Expression]) = this(arguments, 42L)
+
+ override def dataType: DataType = LongType
+
+ override def prettyName: String = "collation_aware_xxhash64"
+
+ override protected def hasherClassName: String = classOf[XXH64].getName
+
+ override protected def isCollationAware: Boolean = true
+
+ override protected def computeHash(value: Any, dataType: DataType, seed: Long): Long = {
+ XxHash64Function.hash(
+ value, dataType, seed, isCollationAware, legacyCollationAwareHashing)
+ }
+
+ override protected def withNewChildrenInternal(newChildren: IndexedSeq[Expression]):
+ CollationAwareXxHash64 = copy(children = newChildren)
+}
+
/**
* Simulates Hive's hashing function from Hive v1.2.1 at
* org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorUtils#hashcode()
@@ -738,8 +895,12 @@ case class HiveHash(children: Seq[Expression]) extends HashExpression[Int] {
override protected def hasherClassName: String = classOf[HiveHasher].getName
+ override protected def isCollationAware: Boolean = true
+
override protected def computeHash(value: Any, dataType: DataType, seed: Int): Int = {
- HiveHashFunction.hash(value, dataType, this.seed).toInt
+ HiveHashFunction.hash(
+ value, dataType, this.seed, isCollationAware, legacyCollationAwareHashing
+ ).toInt
}
override def doGenCode(ctx: CodegenContext, ev: ExprCode): ExprCode = {
@@ -825,17 +986,18 @@ case class HiveHash(children: Seq[Expression]) extends HashExpression[Int] {
override protected def genHashString(
ctx: CodegenContext, stringType: StringType, input: String, result: String): String = {
- if (stringType.supportsBinaryEquality) {
+ if (stringType.supportsBinaryEquality || !isCollationAware) {
val baseObject = s"$input.getBaseObject()"
val baseOffset = s"$input.getBaseOffset()"
val numBytes = s"$input.numBytes()"
s"$result = $hasherClassName.hashUnsafeBytes($baseObject, $baseOffset, $numBytes);"
} else {
- val stringHash = ctx.freshName("stringHash")
+ val key = ctx.freshName("key")
+ val offset = Platform.BYTE_ARRAY_OFFSET
s"""
- long $stringHash = CollationFactory.fetchCollation(${stringType.collationId})
- .hashFunction.applyAsLong($input);
- $result = $hasherClassName.hashLong($stringHash);
+ byte[] $key = (byte[]) CollationFactory.fetchCollation(${stringType.collationId})
+ .sortKeyFunction.apply($input);
+ $result = $hasherClassName.hashUnsafeBytes($key, $offset, $key.length, $result);
"""
}
}
@@ -1018,7 +1180,12 @@ object HiveHashFunction extends InterpretedHashFunction {
(result * 37) + nanoSeconds
}
- override def hash(value: Any, dataType: DataType, seed: Long): Long = {
+ override def hash(
+ value: Any,
+ dataType: DataType,
+ seed: Long,
+ isCollationAware: Boolean,
+ legacyCollationAwareHashing: Boolean): Long = {
value match {
case null => 0
case array: ArrayData =>
@@ -1031,7 +1198,9 @@ object HiveHashFunction extends InterpretedHashFunction {
var i = 0
val length = array.numElements()
while (i < length) {
- result = (31 * result) + hash(array.get(i, elementType), elementType, 0).toInt
+ result = (31 * result) + hash(
+ array.get(i, elementType), elementType, 0, isCollationAware, legacyCollationAwareHashing
+ ).toInt
i += 1
}
result
@@ -1050,7 +1219,11 @@ object HiveHashFunction extends InterpretedHashFunction {
var i = 0
val length = map.numElements()
while (i < length) {
- result += hash(keys.get(i, kt), kt, 0).toInt ^ hash(values.get(i, vt), vt, 0).toInt
+ result += hash(
+ keys.get(i, kt), kt, 0, isCollationAware, legacyCollationAwareHashing
+ ).toInt ^ hash(
+ values.get(i, vt), vt, 0, isCollationAware, legacyCollationAwareHashing
+ ).toInt
i += 1
}
result
@@ -1066,7 +1239,10 @@ object HiveHashFunction extends InterpretedHashFunction {
var i = 0
val length = struct.numFields
while (i < length) {
- result = (31 * result) + hash(struct.get(i, types(i)), types(i), 0).toInt
+ result = (31 * result) +
+ hash(
+ struct.get(i, types(i)), types(i), 0, isCollationAware, legacyCollationAwareHashing
+ ).toInt
i += 1
}
result
@@ -1074,7 +1250,7 @@ object HiveHashFunction extends InterpretedHashFunction {
case d: Decimal => normalizeDecimal(d.toJavaBigDecimal).hashCode()
case timestamp: Long if dataType.isInstanceOf[TimestampType] => hashTimestamp(timestamp)
case calendarInterval: CalendarInterval => hashCalendarInterval(calendarInterval)
- case _ => super.hash(value, dataType, 0)
+ case _ => super.hash(value, dataType, 0, isCollationAware, legacyCollationAwareHashing)
}
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/json/JsonExpressionEvalUtils.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/json/JsonExpressionEvalUtils.scala
index b942006e87e9d..f0473f5a414f2 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/json/JsonExpressionEvalUtils.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/json/JsonExpressionEvalUtils.scala
@@ -33,13 +33,13 @@ import org.apache.spark.sql.types.{ArrayType, DataType, MapType, StringType, Str
import org.apache.spark.unsafe.types.{UTF8String, VariantVal}
import org.apache.spark.util.Utils
-private[this] sealed trait PathInstruction
-private[this] object PathInstruction {
+sealed trait PathInstruction
+object PathInstruction {
private[expressions] case object Subscript extends PathInstruction
private[expressions] case object Wildcard extends PathInstruction
private[expressions] case object Key extends PathInstruction
private[expressions] case class Index(index: Long) extends PathInstruction
- private[expressions] case class Named(name: String) extends PathInstruction
+ case class Named(name: String) extends PathInstruction
}
private[this] sealed trait WriteStyle
@@ -49,7 +49,7 @@ private[this] object WriteStyle {
private[expressions] case object FlattenStyle extends WriteStyle
}
-private[this] object JsonPathParser extends RegexParsers {
+object JsonPathParser extends RegexParsers {
import PathInstruction._
def root: Parser[Char] = '$'
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/literals.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/literals.scala
index e3ed2c4a0b0b8..c799415dfc706 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/literals.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/literals.scala
@@ -30,14 +30,13 @@ import java.nio.charset.StandardCharsets
import java.sql.{Date, Timestamp}
import java.time.{Duration, Instant, LocalDate, LocalDateTime, LocalTime, Period, ZoneOffset}
import java.util
-import java.util.Objects
+import java.util.{HexFormat, Objects}
import scala.collection.{immutable, mutable}
import scala.math.{BigDecimal, BigInt}
import scala.reflect.runtime.universe.TypeTag
import scala.util.Try
-import org.apache.commons.codec.binary.{Hex => ApacheHex}
import org.json4s.JsonAST._
import org.apache.spark.sql.catalyst.{CatalystTypeConverters, FunctionIdentifier, InternalRow, ScalaReflection}
@@ -49,7 +48,7 @@ import org.apache.spark.sql.catalyst.trees.TreePattern
import org.apache.spark.sql.catalyst.trees.TreePattern.{LITERAL, NULL_LITERAL, TRUE_OR_FALSE_LITERAL}
import org.apache.spark.sql.catalyst.types._
import org.apache.spark.sql.catalyst.util._
-import org.apache.spark.sql.catalyst.util.DateTimeUtils.{instantToMicros, localTimeToMicros}
+import org.apache.spark.sql.catalyst.util.DateTimeUtils.{instantToMicros, localTimeToNanos}
import org.apache.spark.sql.catalyst.util.IntervalStringStyles.ANSI_STYLE
import org.apache.spark.sql.catalyst.util.IntervalUtils.{durationToMicros, periodToMonths, toDayTimeIntervalString, toYearMonthIntervalString}
import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
@@ -89,7 +88,7 @@ object Literal {
case l: LocalDateTime => Literal(DateTimeUtils.localDateTimeToMicros(l), TimestampNTZType)
case ld: LocalDate => Literal(ld.toEpochDay.toInt, DateType)
case d: Date => Literal(DateTimeUtils.fromJavaDate(d), DateType)
- case lt: LocalTime => Literal(localTimeToMicros(lt), TimeType())
+ case lt: LocalTime => Literal(localTimeToNanos(lt), TimeType())
case d: Duration => Literal(durationToMicros(d), DayTimeIntervalType())
case p: Period => Literal(periodToMonths(p), YearMonthIntervalType())
case a: Array[Byte] => Literal(a, BinaryType)
@@ -415,6 +414,9 @@ case class Literal (value: Any, dataType: DataType) extends LeafExpression {
Literal.validateLiteralValue(value, dataType)
override def foldable: Boolean = true
+
+ override def contextIndependentFoldable: Boolean = true
+
override def nullable: Boolean = value == null
private def timeZoneId = DateTimeUtils.getZoneId(SQLConf.get.sessionLocalTimeZone)
@@ -429,7 +431,7 @@ case class Literal (value: Any, dataType: DataType) extends LeafExpression {
override def toString: String = value match {
case null => "null"
- case binary: Array[Byte] => "0x" + ApacheHex.encodeHexString(binary, false)
+ case binary: Array[Byte] => "0x" + HexFormat.of().withUpperCase().formatHex(binary)
case d: ArrayBasedMapData => s"map(${d.toString})"
case other =>
dataType match {
@@ -575,7 +577,7 @@ case class Literal (value: Any, dataType: DataType) extends LeafExpression {
s"TIMESTAMP_NTZ '$toString'"
case (i: CalendarInterval, CalendarIntervalType) =>
s"INTERVAL '${i.toString}'"
- case (v: Array[Byte], BinaryType) => s"X'${ApacheHex.encodeHexString(v, false)}'"
+ case (v: Array[Byte], BinaryType) => s"X'${HexFormat.of().withUpperCase().formatHex(v)}'"
case (i: Long, DayTimeIntervalType(startField, endField)) =>
toDayTimeIntervalString(i, ANSI_STYLE, startField, endField)
case (i: Int, YearMonthIntervalType(startField, endField)) =>
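// A minimal standalone sketch (not part of the patch) of the java.util.HexFormat calls that
// replace Apache Commons' Hex above:
import java.util.HexFormat

val bytes = Array[Byte](0x1A, 0x2B, 0x3C)
// "0x" + upper-case hex, matching the previous "0x" + ApacheHex.encodeHexString(bytes, false).
assert("0x" + HexFormat.of().withUpperCase().formatHex(bytes) == "0x1A2B3C")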
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/mathExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/mathExpressions.scala
index 9db2ac7f9b041..ee3e3e0272767 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/mathExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/mathExpressions.scala
@@ -48,6 +48,7 @@ abstract class LeafMathExpression(c: Double, name: String)
override def dataType: DataType = DoubleType
override def foldable: Boolean = true
+ override def contextIndependentFoldable: Boolean = true
override def nullable: Boolean = false
override def toString: String = s"$name()"
override def prettyName: String = name
@@ -68,6 +69,7 @@ abstract class UnaryMathExpression(val f: Double => Double, name: String)
override def inputTypes: Seq[AbstractDataType] = Seq(DoubleType)
override def dataType: DataType = DoubleType
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
override def nullable: Boolean = true
override def toString: String = s"$prettyName($child)"
override def prettyName: String = getTagValue(FunctionRegistry.FUNC_ALIAS).getOrElse(name)
@@ -87,6 +89,8 @@ abstract class UnaryMathExpression(val f: Double => Double, name: String)
abstract class UnaryLogExpression(f: Double => Double, name: String)
extends UnaryMathExpression(f, name) {
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def nullable: Boolean = true
// values less than or equal to yAsymptote eval to null in Hive, instead of NaN or -Infinity
@@ -123,6 +127,8 @@ abstract class BinaryMathExpression(f: (Double, Double) => Double, name: String)
override def inputTypes: Seq[DataType] = Seq(DoubleType, DoubleType)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def toString: String = s"$prettyName($left, $right)"
override def prettyName: String = getTagValue(FunctionRegistry.FUNC_ALIAS).getOrElse(name)
@@ -1011,6 +1017,7 @@ case class Bin(child: Expression)
with DefaultStringProducingExpression {
override def nullIntolerant: Boolean = true
override def inputTypes: Seq[DataType] = Seq(LongType)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
protected override def nullSafeEval(input: Any): Any =
UTF8String.toBinaryString(input.asInstanceOf[Long])
@@ -1129,6 +1136,8 @@ case class Hex(child: Expression)
case _ => super.dataType
}
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
protected override def nullSafeEval(num: Any): Any = child.dataType match {
case LongType => Hex.hex(num.asInstanceOf[Long])
case BinaryType => Hex.hex(num.asInstanceOf[Array[Byte]])
@@ -1164,6 +1173,7 @@ case class Hex(child: Expression)
case class Unhex(child: Expression, failOnError: Boolean = false)
extends UnaryExpression with ImplicitCastInputTypes {
override def nullIntolerant: Boolean = true
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
def this(expr: Expression) = this(expr, false)
@@ -1263,7 +1273,7 @@ case class Pow(left: Expression, right: Expression)
sealed trait BitShiftOperation
extends BinaryExpression with ImplicitCastInputTypes {
override def nullIntolerant: Boolean = true
-
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
def symbol: String
def shiftInt: (Int, Int) => Int
def shiftLong: (Long, Int) => Long
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/misc.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/misc.scala
index dcbca34b240b5..6f806760b3736 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/misc.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/misc.scala
@@ -327,6 +327,7 @@ case class SparkVersion()
case class TypeOf(child: Expression) extends UnaryExpression with DefaultStringProducingExpression {
override def nullable: Boolean = false
override def foldable: Boolean = true
+ override def contextIndependentFoldable: Boolean = true
override def eval(input: InternalRow): Any = UTF8String.fromString(child.dataType.catalogString)
override def doGenCode(ctx: CodegenContext, ev: ExprCode): ExprCode = {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/nullExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/nullExpressions.scala
index 290f523cc02c1..1aa1d0b25e44c 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/nullExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/nullExpressions.scala
@@ -285,6 +285,8 @@ case class IsNaN(child: Expression) extends UnaryExpression
override def inputTypes: Seq[AbstractDataType] = Seq(TypeCollection(DoubleType, FloatType))
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def nullable: Boolean = false
override def eval(input: InternalRow): Any = {
@@ -334,6 +336,8 @@ case class NaNvl(left: Expression, right: Expression)
override def inputTypes: Seq[AbstractDataType] =
Seq(TypeCollection(DoubleType, FloatType), TypeCollection(DoubleType, FloatType))
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
/**
* We can only guarantee the left child can be always accessed. If we hit the left child,
* the right child will not be accessed.
@@ -406,6 +410,8 @@ case class NaNvl(left: Expression, right: Expression)
case class IsNull(child: Expression) extends UnaryExpression with Predicate {
override def nullable: Boolean = false
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
final override val nodePatterns: Seq[TreePattern] = Seq(NULL_CHECK)
override def eval(input: InternalRow): Any = {
@@ -440,6 +446,8 @@ case class IsNotNull(child: Expression) extends UnaryExpression with Predicate {
final override val nodePatterns: Seq[TreePattern] = Seq(NULL_CHECK)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def eval(input: InternalRow): Any = {
child.eval(input) != null
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/numberFormatExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/numberFormatExpressions.scala
index 21dcbba818d9f..0a6d23977d2f6 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/numberFormatExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/numberFormatExpressions.scala
@@ -54,6 +54,9 @@ abstract class ToNumberBase(left: Expression, right: Expression, errorOnFail: Bo
StringTypeWithCollation(supportsTrimCollation = true),
StringTypeWithCollation(supportsTrimCollation = true))
+
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def checkInputDataTypes(): TypeCheckResult = {
val inputTypeCheck = super.checkInputDataTypes()
if (inputTypeCheck.isSuccess) {
@@ -310,6 +313,7 @@ case class ToCharacter(left: Expression, right: Expression)
inputTypeCheck
}
}
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def prettyName: String = "to_char"
override def nullSafeEval(decimal: Any, format: Any): Any = {
val input = decimal.asInstanceOf[Decimal]
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ordering.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ordering.scala
index 37a3b3a34e49c..c735f5b334bd5 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ordering.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/ordering.scala
@@ -38,6 +38,8 @@ class BaseOrdering extends Ordering[InternalRow] {
* An interpreted row ordering comparator.
*/
class InterpretedOrdering(ordering: Seq[SortOrder]) extends BaseOrdering {
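+ // Use independent copies of the ordering expressions for the two compared rows so that
+ // stateful expressions do not share state between the evaluations of `a` and `b`.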
+ private val leftEvaluators = ordering.map(_.child)
+ private val rightEvaluators = leftEvaluators.map(_.freshCopyIfContainsStatefulExpression())
private lazy val physicalDataTypes = ordering.map { order =>
val dt = order.dataType match {
case udt: UserDefinedType[_] => udt.sqlType
@@ -54,8 +56,8 @@ class InterpretedOrdering(ordering: Seq[SortOrder]) extends BaseOrdering {
val size = ordering.size
while (i < size) {
val order = ordering(i)
- val left = order.child.eval(a)
- val right = order.child.eval(b)
+ val left = leftEvaluators(i).eval(a)
+ val right = rightEvaluators(i).eval(b)
if (left == null && right == null) {
// Both null, continue looking.
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/predicates.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/predicates.scala
index c31c72bc11488..7767e97d34ac5 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/predicates.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/predicates.scala
@@ -32,11 +32,11 @@ import org.apache.spark.sql.catalyst.expressions.codegen.Block._
import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, LeafNode, LogicalPlan, Project, Union}
import org.apache.spark.sql.catalyst.trees.TreePattern._
import org.apache.spark.sql.catalyst.util.{CollationFactory, TypeUtils}
-import org.apache.spark.sql.catalyst.util.SparkStringUtils.truncatedString
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types._
import org.apache.spark.unsafe.types.UTF8String
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.SparkStringUtils.truncatedString
/**
* A base class for generated/interpreted predicate
@@ -67,6 +67,8 @@ case class InterpretedPredicate(expression: Expression) extends BasePredicate {
*/
trait Predicate extends Expression {
override def dataType: DataType = BooleanType
+
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
}
/**
@@ -319,6 +321,8 @@ case class Not(child: Expression)
extends UnaryExpression with Predicate with ImplicitCastInputTypes {
override def nullIntolerant: Boolean = true
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def toString: String = s"NOT $child"
override def inputTypes: Seq[DataType] = Seq(BooleanType)
@@ -481,6 +485,7 @@ case class In(value: Expression, list: Seq[Expression]) extends Predicate {
override def nullable: Boolean = children.exists(_.nullable)
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
final override val nodePatterns: Seq[TreePattern] = Seq(IN)
private val legacyNullInEmptyBehavior =
@@ -619,6 +624,8 @@ case class InSet(child: Expression, hset: Set[Any]) extends UnaryExpression with
require(hset != null, "hset could not be null")
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def simpleString(maxFields: Int): String = {
if (!child.resolved) {
return s"$child INSET (values with unresolved data types)"
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/regexpExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/regexpExpressions.scala
index be7d227d80026..c6e5c480f3c2c 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/regexpExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/regexpExpressions.scala
@@ -37,8 +37,8 @@ import org.apache.spark.sql.catalyst.trees.BinaryLike
import org.apache.spark.sql.catalyst.trees.TreePattern.{LIKE_FAMLIY, REGEXP_EXTRACT_FAMILY, REGEXP_REPLACE, TreePattern}
import org.apache.spark.sql.catalyst.util.{CollationSupport, GenericArrayData, StringUtils}
import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
-import org.apache.spark.sql.internal.types.{
- StringTypeBinaryLcase, StringTypeWithCollation}
+import org.apache.spark.sql.internal.SQLConf
+import org.apache.spark.sql.internal.types.{StringTypeBinaryLcase, StringTypeWithCollation}
import org.apache.spark.sql.types._
import org.apache.spark.unsafe.types.UTF8String
@@ -293,6 +293,8 @@ sealed abstract class MultiLikeBase
extends UnaryExpression with ImplicitCastInputTypes with Predicate {
override def nullIntolerant: Boolean = true
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
protected def patterns: Seq[UTF8String]
protected def isNotSpecified: Boolean
@@ -578,20 +580,33 @@ case class StringSplit(str: Expression, regex: Expression, limit: Expression)
final lazy val collationId: Int = str.dataType.asInstanceOf[StringType].collationId
+ private lazy val legacySplitTruncate =
+ SQLConf.get.getConf(SQLConf.LEGACY_TRUNCATE_FOR_EMPTY_REGEX_SPLIT)
+
def this(exp: Expression, regex: Expression) = this(exp, regex, Literal(-1))
override def nullSafeEval(string: Any, regex: Any, limit: Any): Any = {
- val pattern = CollationSupport.collationAwareRegex(regex.asInstanceOf[UTF8String], collationId)
- val strings = string.asInstanceOf[UTF8String].split(pattern, limit.asInstanceOf[Int])
+ val pattern = CollationSupport.collationAwareRegex(
+ regex.asInstanceOf[UTF8String], collationId, legacySplitTruncate)
+ val strings = if (legacySplitTruncate) {
+ string.asInstanceOf[UTF8String].splitLegacyTruncate(pattern, limit.asInstanceOf[Int])
+ } else {
+ string.asInstanceOf[UTF8String].split(pattern, limit.asInstanceOf[Int])
+ }
new GenericArrayData(strings.asInstanceOf[Array[Any]])
}
override def doGenCode(ctx: CodegenContext, ev: ExprCode): ExprCode = {
val arrayClass = classOf[GenericArrayData].getName
+ val pattern = ctx.freshName("pattern")
nullSafeCodeGen(ctx, ev, (str, regex, limit) => {
// Array in java is covariant, so we don't need to cast UTF8String[] to Object[].
- s"""${ev.value} = new $arrayClass($str.split(
- |CollationSupport.collationAwareRegex($regex, $collationId),$limit));""".stripMargin
+ s"""
+ |UTF8String $pattern =
+ | CollationSupport.collationAwareRegex($regex, $collationId, $legacySplitTruncate);
+ |${ev.value} = new $arrayClass($legacySplitTruncate ?
+ | $str.splitLegacyTruncate($pattern, $limit) : $str.split($pattern, $limit));
+ |""".stripMargin
})
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/stringExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/stringExpressions.scala
index 55cc030a99537..3d32a2ef606c7 100755
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/stringExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/stringExpressions.scala
@@ -94,6 +94,7 @@ case class ConcatWs(children: Seq[Expression])
override def nullable: Boolean = children.head.nullable
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def checkInputDataTypes(): TypeCheckResult = {
if (children.isEmpty) {
@@ -440,6 +441,7 @@ trait String2StringExpression extends ImplicitCastInputTypes {
override def dataType: DataType = child.dataType
override def inputTypes: Seq[AbstractDataType] =
Seq(StringTypeWithCollation(supportsTrimCollation = true))
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
protected override def nullSafeEval(input: Any): Any =
convert(input.asInstanceOf[UTF8String])
@@ -1264,6 +1266,8 @@ case class FindInSet(left: Expression, right: Expression) extends BinaryExpressi
StringTypeWithCollation(supportsTrimCollation = true)
)
+ override def contextIndependentFoldable: Boolean = super.contextIndependentFoldable
+
override protected def nullSafeEval(word: Any, set: Any): Any = {
CollationSupport.FindInSet.
exec(word.asInstanceOf[UTF8String], set.asInstanceOf[UTF8String], collationId)
@@ -1297,6 +1301,7 @@ trait String2TrimExpression extends Expression with ImplicitCastInputTypes {
override def nullable: Boolean = children.exists(_.nullable)
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
protected def doEval(srcString: UTF8String): UTF8String
protected def doEval(srcString: UTF8String, trimString: UTF8String): UTF8String
@@ -1678,6 +1683,8 @@ case class StringInstr(str: Expression, substr: Expression)
StringTypeNonCSAICollation(supportsTrimCollation = true)
)
+ override def contextIndependentFoldable: Boolean = super.contextIndependentFoldable
+
override def nullSafeEval(string: Any, sub: Any): Any = {
CollationSupport.StringInstr.
exec(string.asInstanceOf[UTF8String], sub.asInstanceOf[UTF8String], collationId) + 1
@@ -1729,6 +1736,7 @@ case class SubstringIndex(strExpr: Expression, delimExpr: Expression, countExpr:
StringTypeNonCSAICollation(supportsTrimCollation = true),
IntegerType
)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def first: Expression = strExpr
override def second: Expression = delimExpr
override def third: Expression = countExpr
@@ -2050,6 +2058,7 @@ case class FormatString(children: Expression*) extends Expression with ImplicitC
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def nullable: Boolean = children(0).nullable
override def dataType: DataType = children(0).dataType
@@ -2205,6 +2214,8 @@ case class StringRepeat(str: Expression, times: Expression)
IntegerType
)
+ override def contextIndependentFoldable: Boolean = super.contextIndependentFoldable
+
override def nullSafeEval(string: Any, n: Any): Any = {
string.asInstanceOf[UTF8String].repeat(n.asInstanceOf[Integer])
}
@@ -2235,6 +2246,7 @@ case class StringSpace(child: Expression)
extends UnaryExpression with ImplicitCastInputTypes with DefaultStringProducingExpression {
override def nullIntolerant: Boolean = true
override def inputTypes: Seq[DataType] = Seq(IntegerType)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
override def nullSafeEval(s: Any): Any = {
val length = s.asInstanceOf[Int]
@@ -2302,6 +2314,8 @@ case class Substring(str: Expression, pos: Expression, len: Expression)
IntegerType
)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
+
override def first: Expression = str
override def second: Expression = pos
override def third: Expression = len
@@ -2354,7 +2368,7 @@ case class Right(str: Expression, len: Expression) extends RuntimeReplaceable
If(
LessThanOrEqual(len, Literal(0)),
Literal(UTF8String.EMPTY_UTF8, str.dataType),
- new Substring(str, UnaryMinus(len))
+ new Substring(str, UnaryMinus(len, failOnError = false))
)
)
@@ -2441,6 +2455,7 @@ case class Length(child: Expression)
BinaryType
)
)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
protected override def nullSafeEval(value: Any): Any = child.dataType match {
case _: StringType => value.asInstanceOf[UTF8String].numChars
@@ -2482,6 +2497,7 @@ case class BitLength(child: Expression)
BinaryType
)
)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
protected override def nullSafeEval(value: Any): Any = child.dataType match {
case _: StringType => value.asInstanceOf[UTF8String].numBytes * 8
case BinaryType => value.asInstanceOf[Array[Byte]].length * 8
@@ -2526,6 +2542,7 @@ case class OctetLength(child: Expression)
BinaryType
)
)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
protected override def nullSafeEval(value: Any): Any = child.dataType match {
case _: StringType => value.asInstanceOf[UTF8String].numBytes
@@ -2617,6 +2634,7 @@ case class Levenshtein(
override def nullIntolerant: Boolean = true
override def foldable: Boolean = children.forall(_.foldable)
+ override def contextIndependentFoldable: Boolean = children.forall(_.contextIndependentFoldable)
override def eval(input: InternalRow): Any = {
val leftEval = left.eval(input)
@@ -2722,6 +2740,8 @@ case class SoundEx(child: Expression)
override def inputTypes: Seq[AbstractDataType] =
Seq(StringTypeWithCollation(supportsTrimCollation = true))
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def nullSafeEval(input: Any): Any = input.asInstanceOf[UTF8String].soundex()
override def doGenCode(ctx: CodegenContext, ev: ExprCode): ExprCode = {
@@ -2811,6 +2831,8 @@ case class Chr(child: Expression)
}
}
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def doGenCode(ctx: CodegenContext, ev: ExprCode): ExprCode = {
nullSafeCodeGen(ctx, ev, lon => {
s"""
@@ -2853,6 +2875,8 @@ case class Base64(child: Expression, chunkBase64: Boolean)
override def inputTypes: Seq[DataType] = Seq(BinaryType)
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override lazy val replacement: Expression = StaticInvoke(
classOf[Base64],
dataType,
@@ -2901,6 +2925,7 @@ case class UnBase64(child: Expression, failOnError: Boolean = false)
override def dataType: DataType = BinaryType
override def inputTypes: Seq[AbstractDataType] =
Seq(StringTypeWithCollation(supportsTrimCollation = true))
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
def this(expr: Expression) = this(expr, false)
@@ -3340,6 +3365,7 @@ case class FormatNumber(x: Expression, d: Expression)
override def right: Expression = d
override def nullable: Boolean = true
override def nullIntolerant: Boolean = true
+ override def contextIndependentFoldable: Boolean = super.contextIndependentFoldable
override def inputTypes: Seq[AbstractDataType] =
Seq(
@@ -3590,6 +3616,7 @@ case class StringSplitSQL(
override def left: Expression = str
override def right: Expression = delimiter
override def nullIntolerant: Boolean = true
+ override def contextIndependentFoldable: Boolean = super.contextIndependentFoldable
override def nullSafeEval(string: Any, delimiter: Any): Any = {
val strings = CollationSupport.StringSplitSQL.exec(string.asInstanceOf[UTF8String],
@@ -3752,6 +3779,8 @@ case class Quote(input: Expression)
Seq(StringTypeWithCollation(supportsTrimCollation = true))
}
+ override def contextIndependentFoldable: Boolean = child.contextIndependentFoldable
+
override def nodeName: String = "quote"
override def nullable: Boolean = true
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/timeExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/timeExpressions.scala
index 47f2d5d73e212..ff088876969bd 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/timeExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/timeExpressions.scala
@@ -20,6 +20,7 @@ package org.apache.spark.sql.catalyst.expressions
import java.time.DateTimeException
import java.util.Locale
+import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.{ExpressionBuilder, TypeCheckResult}
import org.apache.spark.sql.catalyst.analysis.TypeCheckResult.{DataTypeMismatch, TypeCheckSuccess}
@@ -32,7 +33,8 @@ import org.apache.spark.sql.catalyst.util.TimeFormatter
import org.apache.spark.sql.catalyst.util.TypeUtils.ordinalNumber
import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
import org.apache.spark.sql.internal.types.StringTypeWithCollation
-import org.apache.spark.sql.types.{AbstractDataType, DataType, DecimalType, IntegerType, ObjectType, TimeType, TypeCollection}
+import org.apache.spark.sql.types.{AbstractDataType, AnyTimeType, ByteType, DataType, DayTimeIntervalType, DecimalType, IntegerType, LongType, ObjectType, TimeType}
+import org.apache.spark.sql.types.DayTimeIntervalType.{HOUR, SECOND}
import org.apache.spark.unsafe.types.UTF8String
/**
@@ -208,8 +210,7 @@ case class MinutesOfTime(child: Expression)
Seq(child.dataType)
)
- override def inputTypes: Seq[AbstractDataType] =
- Seq(TypeCollection(TimeType.MIN_PRECISION to TimeType.MAX_PRECISION map TimeType.apply: _*))
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyTimeType)
override def children: Seq[Expression] = Seq(child)
@@ -268,8 +269,7 @@ case class HoursOfTime(child: Expression)
Seq(child.dataType)
)
- override def inputTypes: Seq[AbstractDataType] =
- Seq(TypeCollection(TimeType.MIN_PRECISION to TimeType.MAX_PRECISION map TimeType.apply: _*))
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyTimeType)
override def children: Seq[Expression] = Seq(child)
@@ -317,9 +317,11 @@ object HourExpressionBuilder extends ExpressionBuilder {
case class SecondsOfTimeWithFraction(child: Expression)
extends RuntimeReplaceable
with ExpectsInputTypes {
-
override def replacement: Expression = {
-
+ val precision = child.dataType match {
+ case TimeType(p) => p
+ case _ => TimeType.MIN_PRECISION
+ }
StaticInvoke(
classOf[DateTimeUtils.type],
DecimalType(8, 6),
@@ -327,10 +329,8 @@ case class SecondsOfTimeWithFraction(child: Expression)
Seq(child, Literal(precision)),
Seq(child.dataType, IntegerType))
}
- private val precision: Int = child.dataType.asInstanceOf[TimeType].precision
- override def inputTypes: Seq[AbstractDataType] =
- Seq(TimeType(precision))
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyTimeType)
override def children: Seq[Expression] = Seq(child)
@@ -352,8 +352,7 @@ case class SecondsOfTime(child: Expression)
Seq(child.dataType)
)
- override def inputTypes: Seq[AbstractDataType] =
- Seq(TypeCollection(TimeType.MIN_PRECISION to TimeType.MAX_PRECISION map TimeType.apply: _*))
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyTimeType)
override def children: Seq[Expression] = Seq(child)
@@ -516,8 +515,8 @@ case class CurrentTime(
override def inputTypes: Seq[AbstractDataType] = Seq(IntegerType)
override def eval(input: InternalRow): Any = {
- val currentTimeOfDayMicros = DateTimeUtils.instantToMicrosOfDay(java.time.Instant.now(), zoneId)
- DateTimeUtils.truncateTimeMicrosToPrecision(currentTimeOfDayMicros, precision)
+ val currentTimeOfDayNanos = DateTimeUtils.instantToNanosOfDay(java.time.Instant.now(), zoneId)
+ DateTimeUtils.truncateTimeToPrecision(currentTimeOfDayNanos, precision)
}
}
@@ -558,7 +557,7 @@ case class MakeTime(
override def replacement: Expression = StaticInvoke(
classOf[DateTimeUtils.type],
TimeType(TimeType.MICROS_PRECISION),
- "timeToMicros",
+ "makeTime",
children,
inputTypes
)
@@ -566,3 +565,187 @@ case class MakeTime(
override protected def withNewChildrenInternal(newChildren: IndexedSeq[Expression]): MakeTime =
copy(hours = newChildren(0), minutes = newChildren(1), secsAndMicros = newChildren(2))
}
+
+/**
+ * Adds day-time interval to time.
+ */
+case class TimeAddInterval(time: Expression, interval: Expression)
+ extends BinaryExpression with RuntimeReplaceable with ExpectsInputTypes {
+ override def nullIntolerant: Boolean = true
+
+ override def left: Expression = time
+ override def right: Expression = interval
+
+ override def toString: String = s"$left + $right"
+ override def sql: String = s"${left.sql} + ${right.sql}"
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyTimeType, DayTimeIntervalType)
+
+ override def replacement: Expression = {
+ val (timePrecision, intervalEndField) = (time.dataType, interval.dataType) match {
+ case (TimeType(p), DayTimeIntervalType(_, endField)) => (p, endField)
+ case _ => throw SparkException.internalError("Unexpected input types: " +
+ s"time type ${time.dataType.sql}, interval type ${interval.dataType.sql}.")
+ }
+ val intervalPrecision = if (intervalEndField < SECOND) {
+ TimeType.MIN_PRECISION
+ } else {
+ TimeType.MICROS_PRECISION
+ }
+ val targetPrecision = Math.max(timePrecision, intervalPrecision)
+ StaticInvoke(
+ classOf[DateTimeUtils.type],
+ TimeType(targetPrecision),
+ "timeAddInterval",
+ Seq(time, Literal(timePrecision), interval, Literal(intervalEndField),
+ Literal(targetPrecision)),
+ Seq(AnyTimeType, IntegerType, DayTimeIntervalType, ByteType, IntegerType),
+ propagateNull = nullIntolerant)
+ }
+
+ override protected def withNewChildrenInternal(
+ newTime: Expression, newInterval: Expression): TimeAddInterval =
+ copy(time = newTime, interval = newInterval)
+}
+
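// A worked illustration of the precision promotion above (a sketch, assuming
// TimeType.MIN_PRECISION = 0 and TimeType.MICROS_PRECISION = 6):
//   TIME(3) + INTERVAL '1' HOUR     -> max(3, 0) = TIME(3)
//   TIME(0) + INTERVAL '1.5' SECOND -> max(0, 6) = TIME(6)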
+/**
+ * Returns a day-time interval between time values.
+ */
+case class SubtractTimes(left: Expression, right: Expression)
+ extends BinaryExpression with RuntimeReplaceable with ExpectsInputTypes {
+ override def nullIntolerant: Boolean = true
+ override def inputTypes: Seq[AbstractDataType] = Seq(AnyTimeType, AnyTimeType)
+
+ override def replacement: Expression = StaticInvoke(
+ classOf[DateTimeUtils.type],
+ DayTimeIntervalType(HOUR, SECOND),
+ "subtractTimes",
+ children,
+ inputTypes,
+ propagateNull = nullIntolerant)
+
+ override def toString: String = s"$left - $right"
+ override def sql: String = s"${left.sql} - ${right.sql}"
+
+ override protected def withNewChildrenInternal(
+ newLeft: Expression, newRight: Expression): SubtractTimes =
+ copy(left = newLeft, right = newRight)
+}
+
+/**
+ * Returns the difference between two times, measured in specified units.
+ */
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(unit, start, end) - Gets the difference between the times in the specified units.
+ """,
+ arguments = """
+ Arguments:
+ * unit - the unit of the difference between the given times
+ - "HOUR"
+ - "MINUTE"
+ - "SECOND"
+ - "MILLISECOND"
+ - "MICROSECOND"
+ * start - a starting TIME expression
+ * end - an ending TIME expression
+ """,
+ examples = """
+ Examples:
+ > SELECT _FUNC_('HOUR', TIME'20:30:29', TIME'21:30:28');
+ 0
+ > SELECT _FUNC_('HOUR', TIME'20:30:29', TIME'21:30:29');
+ 1
+ > SELECT _FUNC_('HOUR', TIME'20:30:29', TIME'12:00:00');
+ -8
+ """,
+ group = "datetime_funcs",
+ since = "4.1.0")
+// scalastyle:on line.size.limit
+case class TimeDiff(
+ unit: Expression,
+ start: Expression,
+ end: Expression)
+ extends TernaryExpression
+ with RuntimeReplaceable
+ with ImplicitCastInputTypes {
+
+ override def first: Expression = unit
+ override def second: Expression = start
+ override def third: Expression = end
+
+ override def inputTypes: Seq[AbstractDataType] =
+ Seq(StringTypeWithCollation(supportsTrimCollation = true), AnyTimeType, AnyTimeType)
+
+ override def dataType: DataType = LongType
+
+ override def prettyName: String = "time_diff"
+
+ override protected def withNewChildrenInternal(
+ newUnit: Expression, newStart: Expression, newEnd: Expression): TimeDiff = {
+ copy(unit = newUnit, start = newStart, end = newEnd)
+ }
+
+ override def replacement: Expression = {
+ StaticInvoke(
+ classOf[DateTimeUtils.type],
+ dataType,
+ "timeDiff",
+ Seq(unit, start, end),
+ Seq(unit.dataType, start.dataType, end.dataType)
+ )
+ }
+}
+
+// scalastyle:off line.size.limit
+@ExpressionDescription(
+ usage = """
+ _FUNC_(unit, time) - Returns `time` truncated to the `unit`.
+ """,
+ arguments = """
+ Arguments:
+ * unit - the unit to truncate to
+ - "HOUR" - zero out the minutes and seconds with fraction part
+ - "MINUTE" - zero out the seconds with fraction part
+ - "SECOND" - zero out the fraction part of seconds
+ - "MILLISECOND" - zero out the microseconds
+ - "MICROSECOND" - zero out the nanoseconds
+ * time - a TIME expression
+ """,
+ examples = """
+ Examples:
+ > SELECT _FUNC_('HOUR', TIME'09:32:05.359');
+ 09:00:00
+ > SELECT _FUNC_('MILLISECOND', TIME'09:32:05.123456');
+ 09:32:05.123
+ """,
+ group = "datetime_funcs",
+ since = "4.1.0")
+// scalastyle:on line.size.limit
+case class TimeTrunc(unit: Expression, time: Expression)
+ extends BinaryExpression with RuntimeReplaceable with ImplicitCastInputTypes {
+
+ override def left: Expression = unit
+ override def right: Expression = time
+
+ override def inputTypes: Seq[AbstractDataType] =
+ Seq(StringTypeWithCollation(supportsTrimCollation = true), AnyTimeType)
+
+ override def dataType: DataType = time.dataType
+
+ override def prettyName: String = "time_trunc"
+
+ override protected def withNewChildrenInternal(
+ newUnit: Expression, newTime: Expression): TimeTrunc =
+ copy(unit = newUnit, time = newTime)
+
+ override def replacement: Expression = {
+ StaticInvoke(
+ classOf[DateTimeUtils.type],
+ dataType,
+ "timeTrunc",
+ Seq(unit, time),
+ Seq(unit.dataType, time.dataType)
+ )
+ }
+}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/windowExpressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/windowExpressions.scala
index ab787663c9923..f26a4dc9a0c0c 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/windowExpressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/expressions/windowExpressions.scala
@@ -20,6 +20,7 @@ package org.apache.spark.sql.catalyst.expressions
import java.util.Locale
import org.apache.spark.SparkException
+import org.apache.spark.api.python.PythonEvalType
import org.apache.spark.sql.catalyst.analysis.{TypeCheckResult, UnresolvedException}
import org.apache.spark.sql.catalyst.analysis.TypeCheckResult.{DataTypeMismatch, TypeCheckSuccess}
import org.apache.spark.sql.catalyst.dsl.expressions._
@@ -401,6 +402,16 @@ object WindowFunctionType {
// consider its type to be SQL as literal(0) is also a SQL expression.
t.getOrElse(SQL)
}
+
+ def pythonEvalType(windowExpression: NamedExpression): Option[Int] = {
+ windowExpression.collectFirst {
+ case udf: PythonUDAF => udf.evalType match {
+ // Infer the eval type of the window operation from the input aggregation type
+ case PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF => PythonEvalType.SQL_WINDOW_AGG_PANDAS_UDF
+ case PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF => PythonEvalType.SQL_WINDOW_AGG_ARROW_UDF
+ }
+ }
+ }
}
trait OffsetWindowFunction extends WindowFunction {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/InlineCTE.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/InlineCTE.scala
index 62d99f7854891..ad1a1a99b8257 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/InlineCTE.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/InlineCTE.scala
@@ -61,10 +61,7 @@ case class InlineCTE(
// 1) It is fine to inline a CTE if it references another CTE that is non-deterministic;
// 2) Any `CTERelationRef` that contains `OuterReference` would have been inlined first.
refCount == 1 ||
- // Don't inline recursive CTEs if not necessary as recursion is very costly.
- // The check if cteDef is recursive is performed by checking if it contains
- // a UnionLoopRef with the same ID.
- (cteDef.deterministic && !cteDef.hasSelfReferenceAsUnionLoopRef) ||
+ cteDef.deterministic ||
cteDef.child.exists(_.expressions.exists(_.isInstanceOf[OuterReference]))
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/Optimizer.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/Optimizer.scala
index 66c3bfb46530a..ef505a0144113 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/Optimizer.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/Optimizer.scala
@@ -20,10 +20,9 @@ package org.apache.spark.sql.catalyst.optimizer
import scala.collection.mutable
import org.apache.spark.SparkException
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.catalyst.SQLConfHelper
import org.apache.spark.sql.catalyst.analysis._
-import org.apache.spark.sql.catalyst.catalog.{InMemoryCatalog, SessionCatalog}
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.SubqueryExpression.hasCorrelatedSubquery
import org.apache.spark.sql.catalyst.expressions.aggregate._
@@ -573,19 +572,6 @@ object EliminateAggregateFilter extends Rule[LogicalPlan] {
}
}
-/**
- * An optimizer used in test code.
- *
- * To ensure extendability, we leave the standard rules in the abstract optimizer rules, while
- * specific rules go to the subclasses
- */
-object SimpleTestOptimizer extends SimpleTestOptimizer
-
-class SimpleTestOptimizer extends Optimizer(
- new CatalogManager(
- FakeV2SessionCatalog,
- new SessionCatalog(new InMemoryCatalog, EmptyFunctionRegistry, EmptyTableFunctionRegistry)))
-
/**
* Remove redundant aliases from a query plan. A redundant alias is an alias that does not change
* the name or metadata of a column, and does not deduplicate it.
@@ -611,7 +597,7 @@ object RemoveRedundantAliases extends Rule[LogicalPlan] {
// If the alias name is different from attribute name, we can't strip it either, or we
// may accidentally change the output schema name of the root plan.
case a @ Alias(attr: Attribute, name)
- if (a.metadata == Metadata.empty || a.metadata == attr.metadata) &&
+ if (a.metadata == attr.metadata) &&
name == attr.name &&
!excludeList.contains(attr) &&
!excludeList.contains(a) =>
@@ -654,16 +640,23 @@ object RemoveRedundantAliases extends Rule[LogicalPlan] {
case u: Union =>
var first = true
plan.mapChildren { child =>
- if (first) {
- first = false
- // `Union` inherits its first child's outputs. We don't remove those aliases from the
- // first child's tree that prevent aliased attributes to appear multiple times in the
- // `Union`'s output. A parent projection node on the top of an `Union` with non-unique
- // output attributes could return incorrect result.
- removeRedundantAliases(child, excluded ++ child.outputSet)
+ if (!conf.unionIsResolvedWhenDuplicatesPerChildResolved || shouldRemoveAliasesUnderUnion(
+ child
+ )) {
+ if (first) {
+ first = false
+ // `Union` inherits its first child's outputs. We don't remove those aliases from the
+ // first child's tree that prevent aliased attributes to appear multiple times in the
+ // `Union`'s output. A parent projection node on the top of an `Union` with
+ // non-unique output attributes could return incorrect result.
+ removeRedundantAliases(child, excluded ++ child.outputSet)
+ } else {
+ // We don't need to exclude those attributes that `Union` inherits from its first
+ // child.
+ removeRedundantAliases(child, excluded -- u.children.head.outputSet)
+ }
} else {
- // We don't need to exclude those attributes that `Union` inherits from its first child.
- removeRedundantAliases(child, excluded -- u.children.head.outputSet)
+ child
}
}
@@ -708,6 +701,44 @@ object RemoveRedundantAliases extends Rule[LogicalPlan] {
}
}
+ /**
+ * When a [[Project]], [[Aggregate]] or [[Window]] is a child of [[Union]], we don't remove an
+ * [[Alias]] if it is on top of an [[Attribute]] that already exists in the output set of the
+ * operator. Otherwise we would end up with an operator that has duplicates in its output,
+ * which leaves the [[Union]] unresolved and makes us fail (but we shouldn't).
+ * For example:
+ *
+ * {{{ SELECT col1 FROM values(1) WHERE 100 IN (SELECT col1 UNION SELECT col1); }}}
+ *
+ * Without the `shouldRemoveAliasesUnderUnion` check, we would remove the [[Alias]] introduced by
+ * the [[DeduplicateRelations]] rule (in a [[Project]] tagged as
+ * `PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION`); the result would be an unresolved [[Union]], which
+ * causes the failure. With the check, the [[Alias]] stays and the plan resolves properly.
+ */
+ private def shouldRemoveAliasesUnderUnion(operator: LogicalPlan): Boolean = {
+ operator match {
+ case project: Project =>
+ project.projectList.forall {
+ case Alias(attribute: Attribute, _) =>
+ !project.outputSet.contains(attribute)
+ case _ => true
+ }
+ case aggregate: Aggregate =>
+ aggregate.aggregateExpressions.forall {
+ case Alias(attribute: Attribute, _) =>
+ !aggregate.outputSet.contains(attribute)
+ case _ => true
+ }
+ case window: Window =>
+ window.windowExpressions.forall {
+ case Alias(attribute: Attribute, _) =>
+ !window.outputSet.contains(attribute)
+ case _ => true
+ }
+ case other => true
+ }
+ }
+
def apply(plan: LogicalPlan): LogicalPlan = removeRedundantAliases(plan, AttributeSet.empty)
}
@@ -936,6 +967,15 @@ object PushProjectionThroughUnion extends Rule[LogicalPlan] {
result.asInstanceOf[A]
}
+ /**
+ * If [[SQLConf.UNION_IS_RESOLVED_WHEN_DUPLICATES_PER_CHILD_RESOLVED]] is true, [[Project]] can
+ * only be pushed down if there are no duplicate [[ExprId]]s in the project list.
+ */
+ def canPushProjectionThroughUnion(project: Project): Boolean = {
+ !conf.unionIsResolvedWhenDuplicatesPerChildResolved ||
+ project.outputSet.size == project.projectList.size
+ }
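// A hypothetical illustration (not part of the patch): a project list such as
//   Project(Seq(a, a), union)  // the same attribute, hence the same ExprId, listed twice
// has project.outputSet.size == 1 but project.projectList.size == 2, so the projection is kept
// above the Union instead of being pushed into its children.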
+
def pushProjectionThroughUnion(projectList: Seq[NamedExpression], u: Union): Seq[LogicalPlan] = {
val newFirstChild = Project(projectList, u.children.head)
val newOtherChildren = u.children.tail.map { child =>
@@ -949,8 +989,9 @@ object PushProjectionThroughUnion extends Rule[LogicalPlan] {
_.containsAllPatterns(UNION, PROJECT)) {
// Push down deterministic projection through UNION ALL
- case Project(projectList, u: Union)
- if projectList.forall(_.deterministic) && u.children.nonEmpty =>
+ case project @ Project(projectList, u: Union)
+ if projectList.forall(_.deterministic) && u.children.nonEmpty &&
+ canPushProjectionThroughUnion(project) =>
u.copy(children = pushProjectionThroughUnion(projectList, u))
}
}
@@ -1041,8 +1082,7 @@ object ColumnPruning extends Rule[LogicalPlan] {
p
}
- // TODO: Pruning `UnionLoop`s needs to take into account both the outer `Project` and the inner
- // `UnionLoopRef` nodes.
+ // Avoid pruning UnionLoop because of its recursive nature.
case p @ Project(_, _: UnionLoop) => p
// Prune unnecessary window expressions
@@ -1280,8 +1320,22 @@ object CollapseProject extends Rule[LogicalPlan] with AliasHelper {
def buildCleanedProjectList(
upper: Seq[NamedExpression],
lower: Seq[NamedExpression]): Seq[NamedExpression] = {
+ val explicitlyPreserveAliasMetadata =
+ conf.getConf(SQLConf.PRESERVE_ALIAS_METADATA_WHEN_COLLAPSING_PROJECTS)
val aliases = getAliasMap(lower)
- upper.map(replaceAliasButKeepName(_, aliases))
+ upper.map {
+ case alias: Alias if !alias.metadata.isEmpty && explicitlyPreserveAliasMetadata =>
+ replaceAliasButKeepName(alias, aliases) match {
+ case newAlias: Alias => Alias(child = newAlias.child, name = newAlias.name)(
+ exprId = newAlias.exprId,
+ qualifier = newAlias.qualifier,
+ explicitMetadata = Some(alias.metadata),
+ nonInheritableMetadataKeys = newAlias.nonInheritableMetadataKeys
+ )
+ case other => other
+ }
+ case other => replaceAliasButKeepName(other, aliases)
+ }
}
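// A sketch (not part of the patch) of the metadata-preserving branch above: if the upper alias
// carries metadata m and the flag is enabled, e.g.
//   Alias(b, "x")(explicitMetadata = Some(m))  collapsed over  Alias(a, "b")()
// the rewritten alias is re-created with explicitMetadata = Some(m), so m survives even though
// the alias' child expression was rewritten during substitution.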
/**
@@ -1576,7 +1630,7 @@ object InferFiltersFromConstraints extends Rule[LogicalPlan]
*/
object CombineUnions extends Rule[LogicalPlan] {
import CollapseProject.{buildCleanedProjectList, canCollapseExpressions}
- import PushProjectionThroughUnion.pushProjectionThroughUnion
+ import PushProjectionThroughUnion.{canPushProjectionThroughUnion, pushProjectionThroughUnion}
def apply(plan: LogicalPlan): LogicalPlan = plan.transformDownWithPruning(
_.containsAnyPattern(UNION, DISTINCT_LIKE), ruleId) {
@@ -1621,17 +1675,19 @@ object CombineUnions extends Rule[LogicalPlan] {
stack.pushAll(children.reverse)
// Push down projection through Union and then push pushed plan to Stack if
// there is a Project.
- case Project(projectList, Distinct(u @ Union(children, byName, allowMissingCol)))
+ case project @ Project(projectList, Distinct(u @ Union(children, byName, allowMissingCol)))
if projectList.forall(_.deterministic) && children.nonEmpty &&
- flattenDistinct && byName == topByName && allowMissingCol == topAllowMissingCol =>
+ flattenDistinct && byName == topByName && allowMissingCol == topAllowMissingCol &&
+ canPushProjectionThroughUnion(project) =>
stack.pushAll(pushProjectionThroughUnion(projectList, u).reverse)
- case Project(projectList, Deduplicate(keys: Seq[Attribute], u: Union))
+ case project @ Project(projectList, Deduplicate(keys: Seq[Attribute], u: Union))
if projectList.forall(_.deterministic) && flattenDistinct && u.byName == topByName &&
- u.allowMissingCol == topAllowMissingCol && AttributeSet(keys) == u.outputSet =>
+ u.allowMissingCol == topAllowMissingCol && AttributeSet(keys) == u.outputSet &&
+ canPushProjectionThroughUnion(project) =>
stack.pushAll(pushProjectionThroughUnion(projectList, u).reverse)
- case Project(projectList, u @ Union(children, byName, allowMissingCol))
- if projectList.forall(_.deterministic) && children.nonEmpty &&
- byName == topByName && allowMissingCol == topAllowMissingCol =>
+ case project @ Project(projectList, u @ Union(children, byName, allowMissingCol))
+ if projectList.forall(_.deterministic) && children.nonEmpty && byName == topByName &&
+ allowMissingCol == topAllowMissingCol && canPushProjectionThroughUnion(project) =>
stack.pushAll(pushProjectionThroughUnion(projectList, u).reverse)
case child =>
flattened += child
@@ -2574,6 +2630,28 @@ object GenerateOptimization extends Rule[LogicalPlan] {
p.withNewChildren(Seq(updatedGenerate))
case _ => p
}
+
+ case p @ Project(_, g: Generate) if g.generator.isInstanceOf[JsonTuple] =>
+ val generatorOutput = g.generatorOutput
+ val usedOutputs =
+ AttributeSet(generatorOutput).intersect(AttributeSet(p.projectList.flatMap(_.references)))
+
+ usedOutputs.size match {
+ case 0 =>
+ p.withNewChildren(g.children)
+ case n if n < generatorOutput.size =>
+ val originJsonTuple = g.generator.asInstanceOf[JsonTuple]
+ val (newJsonExpressions, newGeneratorOutput) =
+ generatorOutput.zipWithIndex.collect {
+ case (attr, i) if usedOutputs.contains(attr) =>
+ (originJsonTuple.children(i + 1), attr)
+ }.unzip
+ p.withNewChildren(Seq(g.copy(
+ generator = JsonTuple(originJsonTuple.children.head +: newJsonExpressions),
+ generatorOutput = newGeneratorOutput)))
+ case _ =>
+ p
+ }
}
}
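A REPL-style illustration of the pruning decision in the `JsonTuple` case above, with plain strings standing in for attributes and field expressions (all names here are illustrative only):

```scala
val generatorOutput = Seq("c0", "c1", "c2")
val jsonFields = Seq("'a'", "'b'", "'c'")   // as in json_tuple(js, 'a', 'b', 'c')
val referenced = Set("c0", "c2")            // outputs the Project actually uses

// Keep only the (field, output) pairs whose output attribute is referenced.
val (keptFields, keptOutput) = generatorOutput.zip(jsonFields).collect {
  case (attr, field) if referenced.contains(attr) => (field, attr)
}.unzip

assert(keptFields == Seq("'a'", "'c'"))
assert(keptOutput == Seq("c0", "c2"))
```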
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/RemoveRedundantAggregates.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/RemoveRedundantAggregates.scala
index d6a4bd030c9d6..b4602d0ddcc93 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/RemoveRedundantAggregates.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/RemoveRedundantAggregates.scala
@@ -54,7 +54,13 @@ object RemoveRedundantAggregates extends Rule[LogicalPlan] with AliasHelper {
.map(_.toAttribute)
))
- upperHasNoDuplicateSensitiveAgg && upperRefsOnlyDeterministicNonAgg
+ // If the lower aggregation is global, it is not redundant because a project with
+ // non-aggregate expressions is semantically different from a global aggregation.
+ // E.g., if the input relation is empty, a project might be optimized to an empty
+ // relation, while a global aggregation will return a single row.
+ lazy val lowerIsGlobalAgg = lower.groupingExpressions.isEmpty
+
+ upperHasNoDuplicateSensitiveAgg && upperRefsOnlyDeterministicNonAgg && !lowerIsGlobalAgg
}
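The empty-input argument in the comment can be reproduced with plain collections standing in for relations; a minimal sketch, not Spark code:

```scala
val emptyInput: Seq[Int] = Seq.empty

val projected = emptyInput.map(_ + 1)    // a projection over empty input: no rows
val globalAgg = Seq(emptyInput.size)     // a global aggregation: always exactly one row

assert(projected.isEmpty)
assert(globalAgg == Seq(0))
```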
private def isDuplicateSensitive(ae: AggregateExpression): Boolean = {
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/ReplaceNullWithFalseInPredicate.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/ReplaceNullWithFalseInPredicate.scala
index 0358c45815944..7134c3daf3baa 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/ReplaceNullWithFalseInPredicate.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/ReplaceNullWithFalseInPredicate.scala
@@ -19,7 +19,6 @@ package org.apache.spark.sql.catalyst.optimizer
import org.apache.spark.SparkIllegalArgumentException
import org.apache.spark.internal.LogKeys.{SQL_TEXT, UNSUPPORTED_EXPR}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.expressions.{And, ArrayExists, ArrayFilter, CaseWhen, EqualNullSafe, Expression, If, In, InSet, LambdaFunction, Literal, MapFilter, Not, Or}
import org.apache.spark.sql.catalyst.expressions.Literal.{FalseLiteral, TrueLiteral}
import org.apache.spark.sql.catalyst.plans.logical.{DeleteAction, DeleteFromTable, Filter, InsertAction, InsertStarAction, Join, LogicalPlan, MergeAction, MergeIntoTable, ReplaceData, UpdateAction, UpdateStarAction, UpdateTable, WriteDelta}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/expressions.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/expressions.scala
index b3236bbfa3755..856236750f7bf 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/expressions.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/expressions.scala
@@ -59,7 +59,20 @@ object ConstantFolding extends Rule[LogicalPlan] {
case _ => false
}
- private def constantFolding(
+ private def tryFold(expr: Expression, isConditionalBranch: Boolean): Expression = {
+ try {
+ Literal.create(expr.freshCopyIfContainsStatefulExpression().eval(EmptyRow), expr.dataType)
+ } catch {
+ case NonFatal(_) if isConditionalBranch =>
+ // When doing constant folding inside conditional expressions, we should not fail
+ // during expression evaluation: the branch being folded may never be reached at
+ // runtime, so failing the whole query here would not match the original behavior.
+ expr.setTagValue(FAILED_TO_EVALUATE, ())
+ expr
+ }
+ }
+
+ private[sql] def constantFolding(
e: Expression,
isConditionalBranch: Boolean = false): Expression = e match {
case c: ConditionalExpression if !c.foldable =>
@@ -78,17 +91,7 @@ object ConstantFolding extends Rule[LogicalPlan] {
case e if e.getTagValue(FAILED_TO_EVALUATE).isDefined => e
// Fold expressions that are foldable.
- case e if e.foldable =>
- try {
- Literal.create(e.freshCopyIfContainsStatefulExpression().eval(EmptyRow), e.dataType)
- } catch {
- case NonFatal(_) if isConditionalBranch =>
- // When doing constant folding inside conditional expressions, we should not fail
- // during expression evaluation, as the branch we are evaluating may not be reached at
- // runtime, and we shouldn't fail the query, to match the original behavior.
- e.setTagValue(FAILED_TO_EVALUATE, ())
- e
- }
+ case e if e.foldable => tryFold(e, isConditionalBranch)
// Don't replace ScalarSubquery if its plan is an aggregate that may suffer from a COUNT bug.
case s @ ScalarSubquery(_, _, _, _, _, mayHaveCountBug, _)
@@ -100,7 +103,13 @@ object ConstantFolding extends Rule[LogicalPlan] {
case s: ScalarSubquery if s.plan.maxRows.contains(0) =>
Literal(null, s.dataType)
- case other => other.mapChildren(constantFolding(_, isConditionalBranch))
+ case other =>
+ val newOther = other.mapChildren(constantFolding(_, isConditionalBranch))
+ if (newOther.foldable) {
+ tryFold(newOther, isConditionalBranch)
+ } else {
+ newOther
+ }
}
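A REPL-style sketch of the `tryFold` behavior introduced above, with plain `Int` arithmetic standing in for Catalyst expression evaluation (the helper name and return type are illustrative):

```scala
import scala.util.control.NonFatal

def tryFoldSketch(compute: => Int, insideConditionalBranch: Boolean): Either[String, Int] =
  try Right(compute)                     // fold to a "literal" when evaluation succeeds
  catch {
    // Inside a conditional branch the failure is swallowed and the expression is kept.
    case NonFatal(_) if insideConditionalBranch => Left("kept unevaluated")
  }

assert(tryFoldSketch(1 + 1, insideConditionalBranch = false) == Right(2))
assert(tryFoldSketch(1 / 0, insideConditionalBranch = true) == Left("kept unevaluated"))
// Outside a conditional branch, 1 / 0 would rethrow, mirroring the rule above.
```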
def apply(plan: LogicalPlan): LogicalPlan = plan.transformWithPruning(AlwaysProcess.fn, ruleId) {
@@ -726,7 +735,7 @@ object SupportedBinaryExpr {
case _: BinaryArithmetic => Some(expr, expr.children.head, expr.children.last)
case _: BinaryMathExpression => Some(expr, expr.children.head, expr.children.last)
case _: AddMonths | _: DateAdd | _: DateAddInterval | _: DateDiff | _: DateSub |
- _: DateAddYMInterval | _: TimestampAddYMInterval | _: TimeAdd =>
+ _: DateAddYMInterval | _: TimestampAddYMInterval | _: TimestampAddInterval =>
Some(expr, expr.children.head, expr.children.last)
case _: FindInSet | _: RoundBase => Some(expr, expr.children.head, expr.children.last)
case BinaryPredicate(expr) =>
@@ -743,10 +752,11 @@ object SupportedBinaryExpr {
object LikeSimplification extends Rule[LogicalPlan] with PredicateHelper {
// if guards below protect from escapes on trailing %.
// Cases like "something\%" are not optimized, but this does not affect correctness.
- private val startsWith = "([^_%]+)%".r
- private val endsWith = "%([^_%]+)".r
- private val startsAndEndsWith = "([^_%]+)%([^_%]+)".r
- private val contains = "%([^_%]+)%".r
+ // Consecutive wildcard characters are equivalent to a single wildcard character.
+ private val startsWith = "([^_%]+)%+".r
+ private val endsWith = "%+([^_%]+)".r
+ private val startsAndEndsWith = "([^_%]+)%+([^_%]+)".r
+ private val contains = "%+([^_%]+)%+".r
private val equalTo = "([^_%]*)".r
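A quick REPL check that the widened patterns treat a run of `%` like a single `%` (matching a `String` against a `Regex` extractor requires the whole string to match):

```scala
val startsWithSketch = "([^_%]+)%+".r
val containsSketch = "%+([^_%]+)%+".r

"abc%%%" match { case startsWithSketch(prefix) => assert(prefix == "abc") }
"%%x%%" match { case containsSketch(body) => assert(body == "x") }
```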
private def simplifyLike(
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/finishAnalysis.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/finishAnalysis.scala
index 21e09f2e56d19..c9c26d473b982 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/finishAnalysis.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/finishAnalysis.scala
@@ -31,7 +31,7 @@ import org.apache.spark.sql.catalyst.trees.TreePattern._
import org.apache.spark.sql.catalyst.trees.TreePatternBits
import org.apache.spark.sql.catalyst.util.DateTimeUtils
import org.apache.spark.sql.catalyst.util.DateTimeUtils.{convertSpecialDate, convertSpecialTimestamp, convertSpecialTimestampNTZ, instantToMicros, localDateTimeToMicros}
-import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils.{instantToMicrosOfDay, truncateTimeMicrosToPrecision}
+import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils.{instantToNanosOfDay, truncateTimeToPrecision}
import org.apache.spark.sql.catalyst.util.TypeUtils.toSQLExpr
import org.apache.spark.sql.connector.catalog.CatalogManager
import org.apache.spark.sql.types._
@@ -114,7 +114,7 @@ object ComputeCurrentTime extends Rule[LogicalPlan] {
val instant = Instant.now()
val currentTimestampMicros = instantToMicros(instant)
val currentTime = Literal.create(currentTimestampMicros, TimestampType)
- val currentTimeOfDayMicros = instantToMicrosOfDay(instant, conf.sessionLocalTimeZone)
+ val currentTimeOfDayNanos = instantToNanosOfDay(instant, conf.sessionLocalTimeZone)
val timezone = Literal.create(conf.sessionLocalTimeZone, StringType)
val currentDates = collection.mutable.HashMap.empty[ZoneId, Literal]
val localTimestamps = collection.mutable.HashMap.empty[ZoneId, Literal]
@@ -132,7 +132,7 @@ object ComputeCurrentTime extends Rule[LogicalPlan] {
DateTimeUtils.microsToDays(currentTimestampMicros, cd.zoneId), DateType)
})
case currentTimeType : CurrentTime =>
- val truncatedTime = truncateTimeMicrosToPrecision(currentTimeOfDayMicros,
+ val truncatedTime = truncateTimeToPrecision(currentTimeOfDayNanos,
currentTimeType.precision)
Literal.create(truncatedTime, TimeType(currentTimeType.precision))
case CurrentTimestamp() | Now() => currentTime
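A hedged sketch of what truncating a nanoseconds-of-day value to a `TIME(p)` precision looks like; `truncateNanosOfDay` below is an illustrative stand-in, not Spark's `truncateTimeToPrecision`:

```scala
def truncateNanosOfDay(nanosOfDay: Long, precision: Int): Long = {
  require(precision >= 0 && precision <= 9)
  val factor = math.pow(10, 9 - precision).toLong   // e.g. precision 3 -> 1,000,000
  nanosOfDay / factor * factor
}

val nanos = 45296123456789L                              // 12:34:56.123456789
assert(truncateNanosOfDay(nanos, 3) == 45296123000000L)  // 12:34:56.123
assert(truncateNanosOfDay(nanos, 0) == 45296000000000L)  // 12:34:56
```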
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/joins.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/joins.scala
index 9413bd7b454d4..be07b440a118b 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/joins.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/optimizer/joins.scala
@@ -20,7 +20,7 @@ package org.apache.spark.sql.catalyst.optimizer
import scala.annotation.tailrec
import scala.util.control.NonFatal
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{HASH_JOIN_KEYS, JOIN_CONDITION}
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/AstBuilder.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/AstBuilder.scala
index 9b9ff2175457b..4e930280381c1 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/AstBuilder.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/AstBuilder.scala
@@ -28,28 +28,30 @@ import org.antlr.v4.runtime.{ParserRuleContext, RuleContext, Token}
import org.antlr.v4.runtime.tree.{ParseTree, RuleNode, TerminalNode}
import org.apache.spark.{SparkArithmeticException, SparkException, SparkIllegalArgumentException, SparkThrowable, SparkThrowableHelper}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.PARTITION_SPECIFICATION
-import org.apache.spark.sql.catalyst.{EvaluateUnresolvedInlineTable, FunctionIdentifier, SQLConfHelper, TableIdentifier}
+import org.apache.spark.sql.catalyst.{FunctionIdentifier, SQLConfHelper, TableIdentifier}
import org.apache.spark.sql.catalyst.analysis._
import org.apache.spark.sql.catalyst.analysis.FunctionRegistry.FUNC_ALIAS
import org.apache.spark.sql.catalyst.catalog.{BucketSpec, CatalogStorageFormat, ClusterBySpec}
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate.{AnyValue, First, Last}
+import org.apache.spark.sql.catalyst.expressions.json.JsonPathParser
+import org.apache.spark.sql.catalyst.expressions.json.PathInstruction.Named
import org.apache.spark.sql.catalyst.parser.SqlBaseParser._
import org.apache.spark.sql.catalyst.plans._
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin}
import org.apache.spark.sql.catalyst.trees.TreePattern.PARAMETER
import org.apache.spark.sql.catalyst.types.DataTypeUtils
-import org.apache.spark.sql.catalyst.util.{CharVarcharUtils, CollationFactory, DateTimeUtils, IntervalUtils, SparkParserUtils}
+import org.apache.spark.sql.catalyst.util.{CharVarcharUtils, CollationFactory, DateTimeUtils, EvaluateUnresolvedInlineTable, IntervalUtils}
import org.apache.spark.sql.catalyst.util.DateTimeUtils.{convertSpecialDate, convertSpecialTimestamp, convertSpecialTimestampNTZ, getZoneId, stringToDate, stringToTime, stringToTimestamp, stringToTimestampWithoutTimeZone}
import org.apache.spark.sql.connector.catalog.{CatalogV2Util, SupportsNamespaces, TableCatalog, TableWritePrivilege}
import org.apache.spark.sql.connector.catalog.TableChange.ColumnPosition
import org.apache.spark.sql.connector.expressions.{ApplyTransform, BucketTransform, DaysTransform, Expression => V2Expression, FieldReference, HoursTransform, IdentityTransform, LiteralValue, MonthsTransform, Transform, YearsTransform}
import org.apache.spark.sql.errors.{DataTypeErrorsBase, QueryCompilationErrors, QueryParsingErrors, SqlScriptingErrors}
import org.apache.spark.sql.internal.SQLConf
-import org.apache.spark.sql.internal.SQLConf.LEGACY_BANG_EQUALS_NOT
+import org.apache.spark.sql.internal.SQLConf.{LEGACY_BANG_EQUALS_NOT, LEGACY_CONSECUTIVE_STRING_LITERALS}
import org.apache.spark.sql.types._
import org.apache.spark.sql.util.CaseInsensitiveStringMap
import org.apache.spark.unsafe.types.{CalendarInterval, UTF8String}
@@ -128,7 +130,7 @@ class AstBuilder extends DataTypeAstBuilder
* @return The original input text, including all whitespaces and formatting.
*/
private def getOriginalText(ctx: ParserRuleContext): String = {
- SparkParserUtils.source(ctx)
+ source(ctx)
}
/**
@@ -555,6 +557,7 @@ class AstBuilder extends DataTypeAstBuilder
val query = withOrigin(queryCtx) {
SingleStatement(visitQuery(queryCtx))
}
+ parsingCtx.labelContext.enterForScope(Option(ctx.multipartIdentifier()))
val varName = Option(ctx.multipartIdentifier()).map(_.getText)
val body = visitCompoundBodyImpl(
ctx.compoundBody(),
@@ -562,6 +565,7 @@ class AstBuilder extends DataTypeAstBuilder
parsingCtx,
isScope = false
)
+ parsingCtx.labelContext.exitForScope(Option(ctx.multipartIdentifier()))
parsingCtx.labelContext.exitLabeledScope(Option(ctx.beginLabel()))
ForStatement(query, varName, body, Some(labelText))
@@ -1823,7 +1827,7 @@ class AstBuilder extends DataTypeAstBuilder
// syntax error here accordingly.
val error: String = (if (n.name != null) n.name else n.identifierList).getText
throw new ParseException(
- command = Some(SparkParserUtils.command(n)),
+ command = Some(command(n)),
start = Origin(),
errorClass = "PARSE_SYNTAX_ERROR",
messageParameters = Map(
@@ -3322,6 +3326,24 @@ class AstBuilder extends DataTypeAstBuilder
}
}
+ /**
+ * Create a [[SemiStructuredExtract]] expression.
+ */
+ override def visitSemiStructuredExtract(
+ ctx: SemiStructuredExtractContext): Expression = withOrigin(ctx) {
+ val field = ctx.path.getText
+ // When `field` starts with a bracket, do not add a `.`, as the bracket already implies nesting.
+ // The bracket also implies case-sensitive field extraction.
+ val path = if (field.startsWith("[")) "$" + field else s"$$.$field"
+ val parsedPath = JsonPathParser.parse(path)
+ if (parsedPath.isEmpty) {
+ throw new ParseException(errorClass = "PARSE_SYNTAX_ERROR", ctx = ctx)
+ }
+ val potentialAlias = parsedPath.get.collect { case Named(name) => name }.lastOption
+ val node = SemiStructuredExtract(expression(ctx.col), path)
+ potentialAlias.map { colName => Alias(node, colName)() }.getOrElse(node)
+ }
+
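A standalone sketch of the path-building rule the comment above describes (just the string logic, not the parser or `SemiStructuredExtract` itself):

```scala
def buildJsonPath(field: String): String =
  if (field.startsWith("[")) "$" + field   // bracket already implies nesting
  else s"$$.$field"                        // otherwise root the path with "$."

assert(buildJsonPath("a.b") == "$.a.b")
assert(buildJsonPath("['A']") == "$['A']")
```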
/**
* Create an [[UnresolvedAttribute]] expression or a [[UnresolvedRegex]] if it is a regex
* quoted in ``
@@ -3622,6 +3644,8 @@ class AstBuilder extends DataTypeAstBuilder
private def createString(ctx: StringLiteralContext): String = {
if (conf.escapedStringLiterals) {
ctx.stringLit.asScala.map(x => stringWithoutUnescape(visitStringLit(x))).mkString
+ } else if (conf.getConf(LEGACY_CONSECUTIVE_STRING_LITERALS)) {
+ ctx.stringLit.asScala.map(x => stringIgnoreQuoteQuote(visitStringLit(x))).mkString
} else {
ctx.stringLit.asScala.map(x => string(visitStringLit(x))).mkString
}
@@ -4872,8 +4896,23 @@ class AstBuilder extends DataTypeAstBuilder
.mkString(", ")
throw QueryParsingErrors.multiplePrimaryKeysError(ctx, primaryKeyColumns)
}
+ // If there is a primary key constraint, all columns in the primary key are implicitly NOT NULL.
+ val updatedColumns = if (primaryKeys.nonEmpty) {
+ val lowerCasePkColumns = primaryKeys.head.asInstanceOf[PrimaryKeyConstraint].columns
+ .map(_.toLowerCase(Locale.ROOT))
+ columnDefs.map { colDef =>
+ if (colDef.nullable &&
+ lowerCasePkColumns.contains(colDef.name.toLowerCase(Locale.ROOT))) {
+ colDef.copy(nullable = false)
+ } else {
+ colDef
+ }
+ }
+ } else {
+ columnDefs
+ }
- (columnDefs.toSeq, constraints.toSeq)
+ (updatedColumns.toSeq, constraints.toSeq)
}
}
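A REPL-style sketch of the nullability adjustment above, with a small case class standing in for the column definition (names are illustrative):

```scala
import java.util.Locale

case class ColDefLite(name: String, nullable: Boolean)

// Columns named in the PRIMARY KEY constraint become non-nullable; matching is
// case-insensitive, mirroring the lower-casing in the parser change.
def applyPrimaryKey(cols: Seq[ColDefLite], pkColumns: Seq[String]): Seq[ColDefLite] = {
  val pk = pkColumns.map(_.toLowerCase(Locale.ROOT)).toSet
  cols.map { c =>
    if (c.nullable && pk.contains(c.name.toLowerCase(Locale.ROOT))) c.copy(nullable = false)
    else c
  }
}

assert(
  applyPrimaryKey(Seq(ColDefLite("Id", nullable = true), ColDefLite("v", nullable = true)), Seq("ID")) ==
    Seq(ColDefLite("Id", nullable = false), ColDefLite("v", nullable = true)))
```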
@@ -6340,7 +6379,7 @@ class AstBuilder extends DataTypeAstBuilder
*
* For example:
* {{{
- * DECLARE [OR REPLACE] [VARIABLE] [db_name.]variable_name
+ * DECLARE [OR REPLACE] [VARIABLE] variable_name [COMMA variable_name]*
* [dataType] [defaultExpression];
* }}}
*
@@ -6353,7 +6392,7 @@ class AstBuilder extends DataTypeAstBuilder
throw new ParseException(
errorClass = "INVALID_SQL_SYNTAX.VARIABLE_TYPE_OR_DEFAULT_REQUIRED",
messageParameters = Map.empty,
- ctx.identifierReference)
+ ctx.identifierReferences.get(0))
}
DefaultValueExpression(Literal(null, dataTypeOpt.get), "null")
} else {
@@ -6361,7 +6400,11 @@ class AstBuilder extends DataTypeAstBuilder
dataTypeOpt.map { dt => default.copy(child = Cast(default.child, dt)) }.getOrElse(default)
}
CreateVariable(
- withIdentClause(ctx.identifierReference(), UnresolvedIdentifier(_)),
+ ctx.identifierReferences.asScala.map { identifierReference =>
+ withIdentClause(identifierReference, UnresolvedIdentifier(_))
+ }.toSeq,
defaultExpression,
ctx.REPLACE() != null
)
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/ParserUtils.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/ParserUtils.scala
index 38e92cf9aebdd..a19b4cca28173 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/ParserUtils.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/parser/ParserUtils.scala
@@ -28,7 +28,7 @@ import org.antlr.v4.runtime.tree.{ParseTree, TerminalNodeImpl}
import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.analysis.UnresolvedIdentifier
-import org.apache.spark.sql.catalyst.parser.SqlBaseParser.{BeginLabelContext, EndLabelContext}
+import org.apache.spark.sql.catalyst.parser.SqlBaseParser.{BeginLabelContext, EndLabelContext, MultipartIdentifierContext}
import org.apache.spark.sql.catalyst.plans.logical.{CreateVariable, ErrorCondition}
import org.apache.spark.sql.catalyst.trees.CurrentOrigin
import org.apache.spark.sql.catalyst.util.SparkParserUtils
@@ -151,7 +151,8 @@ class CompoundBodyParsingContext {
def variable(createVariable: CreateVariable, allowVarDeclare: Boolean): Unit = {
if (!allowVarDeclare) {
throw SqlScriptingErrors.variableDeclarationNotAllowedInScope(
- createVariable.origin, createVariable.name.asInstanceOf[UnresolvedIdentifier].nameParts)
+ createVariable.origin,
+ createVariable.names(0).asInstanceOf[UnresolvedIdentifier].nameParts)
}
transitionTo(State.VARIABLE, createVariable = Some(createVariable), None)
}
@@ -229,12 +230,12 @@ class CompoundBodyParsingContext {
case (State.STATEMENT, State.VARIABLE) =>
throw SqlScriptingErrors.variableDeclarationOnlyAtBeginning(
createVariable.get.origin,
- createVariable.get.name.asInstanceOf[UnresolvedIdentifier].nameParts)
+ createVariable.get.names(0).asInstanceOf[UnresolvedIdentifier].nameParts)
case (State.HANDLER, State.VARIABLE) =>
throw SqlScriptingErrors.variableDeclarationOnlyAtBeginning(
createVariable.get.origin,
- createVariable.get.name.asInstanceOf[UnresolvedIdentifier].nameParts)
+ createVariable.get.names(0).asInstanceOf[UnresolvedIdentifier].nameParts)
// Invalid transitions to CONDITION state.
case (State.STATEMENT, State.CONDITION) =>
@@ -245,7 +246,7 @@ class CompoundBodyParsingContext {
case (State.HANDLER, State.CONDITION) =>
throw SqlScriptingErrors.variableDeclarationOnlyAtBeginning(
createVariable.get.origin,
- createVariable.get.name.asInstanceOf[UnresolvedIdentifier].nameParts)
+ createVariable.get.names(0).asInstanceOf[UnresolvedIdentifier].nameParts)
// Invalid transitions to HANDLER state.
case (State.STATEMENT, State.HANDLER) =>
@@ -316,6 +317,23 @@ class SqlScriptingLabelContext {
beginLabelCtx.map(_.multipartIdentifier().getText).isDefined
}
+ /**
+ * Assert that the identifier is not already contained in seenLabels.
+ * If it is, raise an exception.
+ */
+ private def assertIdentifierNotInSeenLabels(
+ identifierCtx: Option[MultipartIdentifierContext]): Unit = {
+ identifierCtx.foreach { ctx =>
+ val identifierName = ctx.getText
+ if (seenLabels.contains(identifierName.toLowerCase(Locale.ROOT))) {
+ withOrigin(ctx) {
+ throw SqlScriptingErrors
+ .duplicateLabels(CurrentOrigin.get, identifierName.toLowerCase(Locale.ROOT))
+ }
+ }
+ }
+ }
+
/**
* Enter a labeled scope and return the label text.
* If the label is defined, it will be returned and added to seenLabels.
@@ -342,9 +360,9 @@ class SqlScriptingLabelContext {
// Do not add the label to the seenLabels set if it is not defined.
java.util.UUID.randomUUID.toString.toLowerCase(Locale.ROOT)
}
- if (SqlScriptingLabelContext.isForbiddenLabelName(labelText)) {
+ if (SqlScriptingLabelContext.isForbiddenLabelOrForVariableName(labelText)) {
withOrigin(beginLabelCtx.get) {
- throw SqlScriptingErrors.labelNameForbidden(CurrentOrigin.get, labelText)
+ throw SqlScriptingErrors.labelOrForVariableNameForbidden(CurrentOrigin.get, labelText)
}
}
labelText
@@ -359,13 +377,46 @@ class SqlScriptingLabelContext {
seenLabels.remove(beginLabelCtx.get.multipartIdentifier().getText.toLowerCase(Locale.ROOT))
}
}
+
+ /**
+ * Enter a for loop scope.
+ * If the for loop variable is defined, assert that it is not already in seenLabels
+ * and then add it to seenLabels.
+ */
+ def enterForScope(identifierCtx: Option[MultipartIdentifierContext]): Unit = {
+ identifierCtx.foreach { ctx =>
+ val identifierName = ctx.getText
+ assertIdentifierNotInSeenLabels(identifierCtx)
+ seenLabels.add(identifierName.toLowerCase(Locale.ROOT))
+
+ if (SqlScriptingLabelContext.isForbiddenLabelOrForVariableName(identifierName)) {
+ withOrigin(ctx) {
+ throw SqlScriptingErrors.labelOrForVariableNameForbidden(
+ CurrentOrigin.get,
+ identifierName.toLowerCase(Locale.ROOT))
+ }
+ }
+ }
+ }
+
+ /**
+ * Exit a for loop scope.
+ * If the for loop variable is defined, it will be removed from seenLabels.
+ */
+ def exitForScope(identifierCtx: Option[MultipartIdentifierContext]): Unit = {
+ identifierCtx.foreach { ctx =>
+ val identifierName = ctx.getText
+ seenLabels.remove(identifierName.toLowerCase(Locale.ROOT))
+ }
+ }
+
}
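A minimal sketch of the `seenLabels` bookkeeping that `enterForScope`/`exitForScope` add, with simplified error handling (a `require` instead of `SqlScriptingErrors`):

```scala
import java.util.Locale
import scala.collection.mutable

val seenLabels = mutable.Set.empty[String]

def enterScope(name: String): Unit = {
  val lower = name.toLowerCase(Locale.ROOT)
  require(!seenLabels.contains(lower), s"duplicate label or FOR variable: $lower")
  seenLabels += lower
}

def exitScope(name: String): Unit = seenLabels -= name.toLowerCase(Locale.ROOT)

enterScope("outer"); enterScope("rec")
exitScope("rec")
enterScope("REC")   // legal again once the inner scope has been exited
```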
object SqlScriptingLabelContext {
private val forbiddenLabelNames: immutable.Set[Regex] =
immutable.Set("builtin".r, "session".r, "sys.*".r)
- def isForbiddenLabelName(labelName: String): Boolean = {
+ def isForbiddenLabelOrForVariableName(labelName: String): Boolean = {
forbiddenLabelNames.exists(_.matches(labelName.toLowerCase(Locale.ROOT)))
}
}
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/NormalizePlan.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/NormalizePlan.scala
index b679514a26056..df2f95e1cf1e0 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/NormalizePlan.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/NormalizePlan.scala
@@ -19,11 +19,8 @@ package org.apache.spark.sql.catalyst.plans
import java.util.HashMap
-import org.apache.spark.sql.catalyst.analysis.{
- DeduplicateRelations,
- GetViewColumnByNameAndOrdinal,
- NormalizeableRelation
-}
+import org.apache.spark.sql.catalyst.analysis.NormalizeableRelation
+import org.apache.spark.sql.catalyst.analysis.resolver.ResolverTag
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
import org.apache.spark.sql.catalyst.optimizer.ReplaceExpressions
@@ -150,24 +147,42 @@ object NormalizePlan extends PredicateHelper {
.reduce(And)
Join(left, right, newJoinType, Some(newCondition), hint)
case project: Project
- if project
- .getTagValue(DeduplicateRelations.PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION)
- .isDefined =>
+ if project.getTagValue(ResolverTag.PROJECT_FOR_EXPRESSION_ID_DEDUPLICATION).isDefined =>
project.child
+
case aggregate @ Aggregate(_, _, innerProject: Project, _) =>
- val newInnerProject = Project(
- innerProject.projectList.sortBy(_.name),
- innerProject.child
- )
- aggregate.copy(child = newInnerProject)
- case Project(outerProjectList, innerProject: Project) =>
- val newInnerProject = Project(
- innerProject.projectList.sortBy(_.name),
- innerProject.child
+ aggregate.copy(child = normalizeProjectListOrder(innerProject))
+
+ case project @ Project(_, innerProject: Project) =>
+ project.copy(child = normalizeProjectListOrder(innerProject))
+
+ case project @ Project(_, innerAggregate: Aggregate) =>
+ project.copy(child = normalizeAggregateListOrder(innerAggregate))
+
+ /**
+ * ORDER BY covered by an output-retaining project on top of GROUP BY
+ */
+ case project @ Project(_, sort @ Sort(_, _, innerAggregate: Aggregate, _)) =>
+ project.copy(child = sort.copy(child = normalizeAggregateListOrder(innerAggregate)))
+
+ /**
+ * HAVING covered by an output-retaining project on top of GROUP BY
+ */
+ case project @ Project(_, filter @ Filter(_, innerAggregate: Aggregate)) =>
+ project.copy(child = filter.copy(child = normalizeAggregateListOrder(innerAggregate)))
+
+ /**
+ * HAVING ... ORDER BY covered by an output-retaining project on top of GROUP BY
+ */
+ case project @ Project(
+ _,
+ sort @ Sort(_, _, filter @ Filter(_, innerAggregate: Aggregate), _)
+ ) =>
+ project.copy(
+ child =
+ sort.copy(child = filter.copy(child = normalizeAggregateListOrder(innerAggregate)))
)
- Project(normalizeProjectList(outerProjectList), newInnerProject)
- case Project(projectList, child) =>
- Project(normalizeProjectList(projectList), child)
+
case c: KeepAnalyzedQuery => c.storeAnalyzedQuery()
case localRelation: LocalRelation if !localRelation.data.isEmpty =>
/**
@@ -204,14 +219,12 @@ object NormalizePlan extends PredicateHelper {
case _ => condition // Don't reorder.
}
- private def normalizeProjectList(projectList: Seq[NamedExpression]): Seq[NamedExpression] = {
- projectList
- .map { e =>
- e.transformUp {
- case g: GetViewColumnByNameAndOrdinal => g.copy(viewDDL = None)
- }
- }
- .asInstanceOf[Seq[NamedExpression]]
+ private def normalizeProjectListOrder(project: Project): Project = {
+ project.copy(projectList = project.projectList.sortBy(_.name))
+ }
+
+ private def normalizeAggregateListOrder(aggregate: Aggregate): Aggregate = {
+ aggregate.copy(aggregateExpressions = aggregate.aggregateExpressions.sortBy(_.name))
}
}
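The new helpers only reorder expression lists by name so that plans differing merely in column order compare equal; a trivial REPL illustration with tuples standing in for named expressions:

```scala
val planA = Seq("b" -> "expr2", "a" -> "expr1")
val planB = Seq("a" -> "expr1", "b" -> "expr2")

assert(planA.sortBy(_._1) == planB.sortBy(_._1))
```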
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/QueryPlan.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/QueryPlan.scala
index 3eb4cdef9ea9b..7801cd347f7dc 100644
--- a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/QueryPlan.scala
+++ b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/plans/QueryPlan.scala
@@ -24,6 +24,7 @@ import scala.collection.mutable
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.SQLConfHelper
+import org.apache.spark.sql.catalyst.analysis.UnresolvedException
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.rules.RuleId
import org.apache.spark.sql.catalyst.rules.UnknownRuleId
@@ -55,6 +56,32 @@ abstract class QueryPlan[PlanType <: QueryPlan[PlanType]]
def output: Seq[Attribute]
+ override def nodeWithOutputColumnsString(maxColumns: Int): String = {
+ try {
+ nodeName + {
+ if (this.output.length > maxColumns) {
+ val outputWithNullability = this.output.take(maxColumns).map { attr =>
+ attr.toString + s"[nullable=${attr.nullable}]"
+ }
+
+ outputWithNullability.mkString("
+
+ <dependency>
+   <groupId>org.scalameta</groupId>
+   <artifactId>semanticdb-shared_${scala.binary.version}</artifactId>
+   <version>4.13.1.1</version>
+   <exclusions>
+     <exclusion>
+       <groupId>org.scala-lang</groupId>
+       <artifactId>scalap</artifactId>
+     </exclusion>
+   </exclusions>
+   <scope>provided</scope>
+ </dependency>
+ <dependency>
+   <groupId>org.apache.spark</groupId>
+   <artifactId>spark-tags_${scala.binary.version}</artifactId>
+   <type>test-jar</type>
+   <scope>test</scope>
+ </dependency>
+ <dependency>
+   <groupId>commons-io</groupId>
+   <artifactId>commons-io</artifactId>
+   <scope>test</scope>
+ </dependency>
+ <dependency>
+   <groupId>org.scalacheck</groupId>
+   <artifactId>scalacheck_${scala.binary.version}</artifactId>
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/PlanGenerationTestSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/PlanGenerationTestSuite.scala
index a548ec7007dbe..b760828a1e99c 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/PlanGenerationTestSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/PlanGenerationTestSuite.scala
@@ -2369,6 +2369,14 @@ class PlanGenerationTestSuite
fn.to_date(fn.col("s"), "yyyy-MM-dd")
}
+ temporalFunctionTest("try_to_date") {
+ fn.try_to_date(fn.col("s"))
+ }
+
+ temporalFunctionTest("try_to_date with format") {
+ fn.try_to_date(fn.col("s"), "yyyy-MM-dd")
+ }
+
temporalFunctionTest("xpath") {
fn.xpath(fn.col("s"), lit("a/b/text()"))
}
@@ -3319,6 +3327,7 @@ class PlanGenerationTestSuite
fn.lit(java.sql.Date.valueOf("2023-02-23")),
fn.lit(java.time.Duration.ofSeconds(200L)),
fn.lit(java.time.Period.ofDays(100)),
+ fn.lit(java.time.LocalTime.of(23, 59, 59, 999999999)),
fn.lit(new CalendarInterval(2, 20, 100L)))
}
@@ -3389,13 +3398,14 @@ class PlanGenerationTestSuite
fn.typedLit(java.sql.Date.valueOf("2023-02-23")),
fn.typedLit(java.time.Duration.ofSeconds(200L)),
fn.typedLit(java.time.Period.ofDays(100)),
+ fn.typedLit(java.time.LocalTime.of(23, 59, 59, 999999999)),
fn.typedLit(new CalendarInterval(2, 20, 100L)),
// Handle parameterized scala types e.g.: List, Seq and Map.
fn.typedLit(Some(1)),
fn.typedLit(Array(1, 2, 3)),
fn.typedLit(Seq(1, 2, 3)),
- fn.typedLit(Map("a" -> 1, "b" -> 2)),
+ fn.typedLit(mutable.LinkedHashMap("a" -> 1, "b" -> 2)),
fn.typedLit(("a", 2, 1.0)),
fn.typedLit[Option[Int]](None),
fn.typedLit[Array[Option[Int]]](Array(Some(1))),
@@ -3404,9 +3414,20 @@ class PlanGenerationTestSuite
fn.typedlit[collection.immutable.Map[Int, Option[Int]]](
collection.immutable.Map(1 -> None)),
fn.typedLit(Seq(Seq(1, 2, 3), Seq(4, 5, 6), Seq(7, 8, 9))),
- fn.typedLit(Seq(Map("a" -> 1, "b" -> 2), Map("a" -> 3, "b" -> 4), Map("a" -> 5, "b" -> 6))),
- fn.typedLit(Map(1 -> Map("a" -> 1, "b" -> 2), 2 -> Map("a" -> 3, "b" -> 4))),
- fn.typedLit((Seq(1, 2, 3), Map("a" -> 1, "b" -> 2), ("a", Map(1 -> "a", 2 -> "b")))))
+ fn.typedLit(
+ Seq(
+ mutable.LinkedHashMap("a" -> 1, "b" -> 2),
+ mutable.LinkedHashMap("a" -> 3, "b" -> 4),
+ mutable.LinkedHashMap("a" -> 5, "b" -> 6))),
+ fn.typedLit(
+ mutable.LinkedHashMap(
+ 1 -> mutable.LinkedHashMap("a" -> 1, "b" -> 2),
+ 2 -> mutable.LinkedHashMap("a" -> 3, "b" -> 4))),
+ fn.typedLit(
+ (
+ Seq(1, 2, 3),
+ mutable.LinkedHashMap("a" -> 1, "b" -> 2),
+ ("a", mutable.LinkedHashMap(1 -> "a", 2 -> "b")))))
}
/* Window API */
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/CatalogSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/CatalogSuite.scala
index b2c19226dc542..bae569978890b 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/CatalogSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/CatalogSuite.scala
@@ -19,13 +19,12 @@ package org.apache.spark.sql.connect
import java.io.{File, FilenameFilter}
-import org.apache.commons.io.FileUtils
-
import org.apache.spark.SparkException
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.connect.test.{ConnectFunSuite, RemoteSparkSession, SQLHelper}
import org.apache.spark.sql.types.{DoubleType, LongType, StructType}
import org.apache.spark.storage.StorageLevel
+import org.apache.spark.util.SparkFileUtils
class CatalogSuite extends ConnectFunSuite with RemoteSparkSession with SQLHelper {
@@ -258,7 +257,7 @@ class CatalogSuite extends ConnectFunSuite with RemoteSparkSession with SQLHelpe
spark.catalog.cacheTable(tableName)
assert(spark.table(tableName).collect().length == 1)
- FileUtils.deleteDirectory(dir)
+ SparkFileUtils.deleteRecursively(dir)
assert(spark.table(tableName).collect().length == 1)
spark.catalog.refreshTable(tableName)
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ClientE2ETestSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ClientE2ETestSuite.scala
index 415960e83f9d1..29dd7d9742f44 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ClientE2ETestSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ClientE2ETestSuite.scala
@@ -18,7 +18,7 @@ package org.apache.spark.sql.connect
import java.io.{ByteArrayOutputStream, PrintStream}
import java.nio.file.Files
-import java.time.DateTimeException
+import java.time.{DateTimeException, LocalTime}
import java.util.Properties
import scala.collection.mutable
@@ -26,7 +26,6 @@ import scala.concurrent.{ExecutionContext, Future}
import scala.concurrent.duration.{DurationInt, FiniteDuration}
import scala.jdk.CollectionConverters._
-import org.apache.commons.io.FileUtils
import org.apache.commons.io.output.TeeOutputStream
import org.scalactic.TolerantNumerics
import org.scalatest.PrivateMethodTester
@@ -46,7 +45,7 @@ import org.apache.spark.sql.connect.test.SparkConnectServerUtils.port
import org.apache.spark.sql.functions._
import org.apache.spark.sql.internal.SqlApiConf
import org.apache.spark.sql.types._
-import org.apache.spark.util.SparkThreadUtils
+import org.apache.spark.util.{SparkFileUtils, SparkSystemUtils, SparkThreadUtils}
class ClientE2ETestSuite
extends QueryTest
@@ -120,7 +119,7 @@ class ClientE2ETestSuite
import session.implicits._
val throwException =
- udf((_: String) => throw new SparkException("test" * 10000))
+ udf((_: String) => throw new SparkException("test".repeat(10000)))
val ex = intercept[SparkException] {
Seq("1").toDS().withColumn("udf_val", throwException($"value")).collect()
@@ -133,7 +132,7 @@ class ClientE2ETestSuite
val cause = ex.getCause.asInstanceOf[SparkException]
assert(cause.getCondition == null)
assert(cause.getMessageParameters.isEmpty)
- assert(cause.getMessage.contains("test" * 10000))
+ assert(cause.getMessage.contains("test".repeat(10000)))
}
}
@@ -228,7 +227,7 @@ class ClientE2ETestSuite
}
test("spark deep recursion") {
- var recursionDepth = if (System.getProperty("os.arch") == "s390x") 400 else 500
+ var recursionDepth = if (SparkSystemUtils.osArch == "s390x") 400 else 500
var df = spark.range(1)
for (a <- 1 to recursionDepth) {
df = df.union(spark.range(a, a + 1))
@@ -346,7 +345,7 @@ class ClientE2ETestSuite
.listFiles()
.filter(file => file.getPath.endsWith(".csv"))(0)
- assert(FileUtils.contentEquals(testDataPath.toFile, outputFile))
+ assert(SparkFileUtils.contentEquals(testDataPath.toFile, outputFile))
}
test("read path collision") {
@@ -1670,6 +1669,53 @@ class ClientE2ETestSuite
}
checkAnswer(df, (0 until 6).map(i => Row(i)))
}
+
+ test("SPARK-52770: Support Time type") {
+ val df = spark.sql("SELECT TIME '12:13:14'")
+
+ checkAnswer(df, Row(LocalTime.of(12, 13, 14)))
+ }
+
+ test("SPARK-53054: DataFrameReader defaults to spark.sql.sources.default") {
+ withTempPath { file =>
+ val path = file.getAbsoluteFile.toURI.toString
+ spark.range(100).write.parquet(file.toPath.toAbsolutePath.toString)
+
+ spark.conf.set("spark.sql.sources.default", "parquet")
+
+ val df = spark.read.load(path)
+ assert(df.count() == 100)
+ }
+ }
+
+ test("SPARK-52930: the nullability of arrays should be preserved using typedlit") {
+ val arrays = Seq(
+ (typedlit(Array[Int]()), false),
+ (typedlit(Array[Int](1)), false),
+ (typedlit(Array[Integer]()), true),
+ (typedlit(Array[Integer](1)), true))
+ for ((array, containsNull) <- arrays) {
+ val df = spark.sql("select 1").select(array)
+ df.createOrReplaceTempView("test_array_nullability")
+ val schema = spark.sql("select * from test_array_nullability").schema
+ assert(schema.fields.head.dataType.asInstanceOf[ArrayType].containsNull === containsNull)
+ }
+ }
+
+ test("SPARK-52930: the nullability of map values should be preserved using typedlit") {
+ val maps = Seq(
+ (typedlit(Map[String, Int]()), false),
+ (typedlit(Map[String, Int]("a" -> 1)), false),
+ (typedlit(Map[String, Integer]()), true),
+ (typedlit(Map[String, Integer]("a" -> 1)), true))
+ for ((map, valueContainsNull) <- maps) {
+ val df = spark.sql("select 1").select(map)
+ df.createOrReplaceTempView("test_map_nullability")
+ val schema = spark.sql("select * from test_map_nullability").schema
+ assert(
+ schema.fields.head.dataType.asInstanceOf[MapType].valueContainsNull === valueContainsNull)
+ }
+ }
}
private[sql] case class ClassData(a: String, b: Int)
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ColumnNodeToProtoConverterSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ColumnNodeToProtoConverterSuite.scala
index 02f0c35c44a8f..90da125b49ff0 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ColumnNodeToProtoConverterSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/ColumnNodeToProtoConverterSuite.scala
@@ -79,15 +79,24 @@ class ColumnNodeToProtoConverterSuite extends ConnectFunSuite {
Literal((12.0, "north", 60.0, "west"), Option(dataType)),
expr { b =>
val builder = b.getLiteralBuilder.getStructBuilder
- builder.getStructTypeBuilder.getStructBuilder
- .addFields(structField("_1", ProtoDataTypes.DoubleType))
- .addFields(structField("_2", stringTypeWithCollation))
- .addFields(structField("_3", ProtoDataTypes.DoubleType))
- .addFields(structField("_4", stringTypeWithCollation))
- builder.addElements(proto.Expression.Literal.newBuilder().setDouble(12.0))
- builder.addElements(proto.Expression.Literal.newBuilder().setString("north"))
- builder.addElements(proto.Expression.Literal.newBuilder().setDouble(60.0))
- builder.addElements(proto.Expression.Literal.newBuilder().setString("west"))
+ builder
+ .addElements(proto.Expression.Literal.newBuilder().setDouble(12.0).build())
+ builder
+ .addElements(proto.Expression.Literal.newBuilder().setString("north").build())
+ builder
+ .addElements(proto.Expression.Literal.newBuilder().setDouble(60.0).build())
+ builder
+ .addElements(proto.Expression.Literal.newBuilder().setString("west").build())
+ builder.setDataTypeStruct(
+ proto.DataType.Struct
+ .newBuilder()
+ .addFields(
+ proto.DataType.StructField.newBuilder().setName("_1").setNullable(true).build())
+ .addFields(structField("_2", stringTypeWithCollation))
+ .addFields(
+ proto.DataType.StructField.newBuilder().setName("_3").setNullable(true).build())
+ .addFields(structField("_4", stringTypeWithCollation))
+ .build())
})
}
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/DataFrameSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/DataFrameSuite.scala
new file mode 100644
index 0000000000000..890245fdd2fba
--- /dev/null
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/DataFrameSuite.scala
@@ -0,0 +1,81 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.connect
+
+import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.connect.test.{QueryTest, RemoteSparkSession}
+import org.apache.spark.sql.functions.{col, concat, lit, when}
+
+class DataFrameSuite extends QueryTest with RemoteSparkSession {
+
+ test("drop") {
+ val sparkSession = spark
+ import sparkSession.implicits._
+
+ val df1 = Seq[(String, String, String)](("a", "b", "c")).toDF("colA", "colB", "colC")
+
+ val df2 = Seq[(String, String, String)](("c", "d", "e")).toDF("colC", "colD", "colE")
+
+ val df3 = df1
+ .join(df2, df1.col("colC") === df2.col("colC"))
+ .withColumn(
+ "colB",
+ when(df1.col("colB") === "b", concat(df1.col("colB").cast("string"), lit("x")))
+ .otherwise(df1.col("colB")))
+
+ val df4 = df3.drop(df1.col("colB"))
+
+ assert(df4.columns === Array("colA", "colB", "colC", "colC", "colD", "colE"))
+ assert(df4.count() === 1)
+ }
+
+ test("drop column from different dataframe") {
+ val sparkSession = spark
+
+ val df1 = spark.range(10)
+ val df2 = df1.select(col("id"), lit(0).as("v0"))
+
+ assert(df2.drop(df2.col("id")).columns === Array("v0"))
+ // drop df1.col("id") from df2, which is semantically equal to df2.col("id")
+ // note that df1.drop(df2.col("id")) works in Classic, but not in Connect
+ assert(df2.drop(df1.col("id")).columns === Array("v0"))
+
+ val df3 = df2.select(col("*"), lit(1).as("v1"))
+ assert(df3.drop(df3.col("id")).columns === Array("v0", "v1"))
+ // drop df2.col("id") from df3, which is semantically equal to df3.col("id")
+ assert(df3.drop(df2.col("id")).columns === Array("v0", "v1"))
+ // drop df1.col("id") from df3, which is semantically equal to df3.col("id")
+ assert(df3.drop(df1.col("id")).columns === Array("v0", "v1"))
+
+ assert(df3.drop(df3.col("v0")).columns === Array("id", "v1"))
+ // drop df2.col("v0") from df3, which is semantically equal to df3.col("v0")
+ assert(df3.drop(df2.col("v0")).columns === Array("id", "v1"))
+ }
+
+ test("lazy column validation") {
+ val session = spark
+ import session.implicits._
+
+ val df1 = Seq(1 -> "y").toDF("a", "y")
+ val df2 = Seq(1 -> "x").toDF("a", "x")
+ val df3 = df1.join(df2, df1("a") === df2("a"))
+ val df4 = df3.select(df1("x")) // <- No exception here
+
+ intercept[AnalysisException] { df4.schema }
+ }
+}
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/SQLImplicitsTestSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/SQLImplicitsTestSuite.scala
index c7b4748f12221..547d5ca7804af 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/SQLImplicitsTestSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/SQLImplicitsTestSuite.scala
@@ -23,7 +23,6 @@ import java.util.concurrent.atomic.AtomicLong
import io.grpc.inprocess.InProcessChannelBuilder
import org.apache.arrow.memory.RootAllocator
-import org.apache.commons.lang3.SystemUtils
import org.scalatest.BeforeAndAfterAll
import org.apache.spark.sql.{Column, Encoder, SaveMode}
@@ -31,6 +30,7 @@ import org.apache.spark.sql.catalyst.encoders.AgnosticEncoders.agnosticEncoderFo
import org.apache.spark.sql.connect.client.SparkConnectClient
import org.apache.spark.sql.connect.client.arrow.{ArrowDeserializers, ArrowSerializer}
import org.apache.spark.sql.connect.test.ConnectFunSuite
+import org.apache.spark.util.SparkSystemUtils
/**
* Test suite for SQL implicits.
@@ -173,7 +173,7 @@ class SQLImplicitsTestSuite extends ConnectFunSuite with BeforeAndAfterAll {
// Spark always converts them to microseconds, this will cause the
// test fail when using Java 17 on Linux, so add `truncatedTo(ChronoUnit.MICROS)` when
// testing on Linux using Java 17 to ensure the accuracy of input data is microseconds.
- if (SystemUtils.IS_OS_LINUX) {
+ if (SparkSystemUtils.isLinux) {
testImplicit(LocalDateTime.now().truncatedTo(ChronoUnit.MICROS))
testImplicit(Instant.now().truncatedTo(ChronoUnit.MICROS))
testImplicit(Timestamp.from(Instant.now().truncatedTo(ChronoUnit.MICROS)))
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/ClassFinderSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/ClassFinderSuite.scala
index 92cd1acd45d40..5eef1de0a5437 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/ClassFinderSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/ClassFinderSuite.scala
@@ -18,8 +18,6 @@ package org.apache.spark.sql.connect.client
import java.nio.file.Paths
-import org.apache.commons.io.FileUtils
-
import org.apache.spark.sql.connect.test.ConnectFunSuite
import org.apache.spark.util.SparkFileUtils
@@ -32,7 +30,7 @@ class ClassFinderSuite extends ConnectFunSuite {
requiredClasses.foreach(className =>
assume(classResourcePath.resolve(className).toFile.exists))
val copyDir = SparkFileUtils.createTempDir().toPath
- FileUtils.copyDirectory(classResourcePath.toFile, copyDir.toFile)
+ SparkFileUtils.copyDirectory(classResourcePath.toFile, copyDir.toFile)
val monitor = new REPLClassDirMonitor(copyDir.toAbsolutePath.toString)
def checkClasses(monitor: REPLClassDirMonitor, additionalClasses: Seq[String] = Nil): Unit = {
@@ -50,7 +48,7 @@ class ClassFinderSuite extends ConnectFunSuite {
val subDir = SparkFileUtils.createTempDir(copyDir.toAbsolutePath.toString)
val classToCopy = copyDir.resolve("Hello.class")
val copyLocation = subDir.toPath.resolve("HelloDup.class")
- FileUtils.copyFile(classToCopy.toFile, copyLocation.toFile)
+ SparkFileUtils.copyFile(classToCopy.toFile, copyLocation.toFile)
checkClasses(monitor, Seq(s"${subDir.getName}/HelloDup.class"))
}
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientRetriesSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientRetriesSuite.scala
new file mode 100644
index 0000000000000..c0738d7de325b
--- /dev/null
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientRetriesSuite.scala
@@ -0,0 +1,282 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.spark.sql.connect.client
+
+import scala.concurrent.duration.FiniteDuration
+
+import com.google.protobuf.{Any, Duration}
+import com.google.rpc
+import io.grpc.{Status, StatusRuntimeException}
+import io.grpc.protobuf.StatusProto
+import org.scalatest.BeforeAndAfterEach
+import org.scalatest.concurrent.Eventually
+
+import org.apache.spark.sql.connect.test.ConnectFunSuite
+
+class SparkConnectClientRetriesSuite
+ extends ConnectFunSuite
+ with BeforeAndAfterEach
+ with Eventually {
+
+ private class DummyFn(e: => Throwable, numFails: Int = 3) {
+ var counter = 0
+ def fn(): Int = {
+ if (counter < numFails) {
+ counter += 1
+ throw e
+ } else {
+ 42
+ }
+ }
+ }
+
+ /** Tracks sleep times in milliseconds for testing purposes. */
+ private class SleepTimeTracker {
+ private val data = scala.collection.mutable.ListBuffer[Long]()
+ def sleep(t: Long): Unit = data.append(t)
+ def times: List[Long] = data.toList
+ def totalSleep: Long = data.sum
+ }
+
+ /** Helper function for creating a test exception with retry_delay */
+ private def createTestExceptionWithDetails(
+ msg: String,
+ code: Status.Code = Status.Code.INTERNAL,
+ retryDelay: FiniteDuration = FiniteDuration(0, "s")): StatusRuntimeException = {
+ // In grpc-java, RetryDelay should be specified as seconds: Long + nanos: Int
+ val seconds = retryDelay.toSeconds
+ val nanos = (retryDelay - FiniteDuration(seconds, "s")).toNanos.toInt
+ val retryDelayMsg = Duration
+ .newBuilder()
+ .setSeconds(seconds)
+ .setNanos(nanos)
+ .build()
+ val retryInfo = rpc.RetryInfo
+ .newBuilder()
+ .setRetryDelay(retryDelayMsg)
+ .build()
+ val status = rpc.Status
+ .newBuilder()
+ .setMessage(msg)
+ .setCode(code.value())
+ .addDetails(Any.pack(retryInfo))
+ .build()
+ StatusProto.toStatusRuntimeException(status)
+ }
+
+ /** Helper function for comparing two sequences of sleep times */
+ private def assertLongSequencesAlmostEqual(
+ first: Seq[Long],
+ second: Seq[Long],
+ delta: Long): Unit = {
+ assert(first.length == second.length, "Lists have different lengths.")
+ for ((a, b) <- first.zip(second)) {
+ assert(math.abs(a - b) <= delta, s"Elements $a and $b differ by more than $delta.")
+ }
+ }
+
+ test("SPARK-44721: Retries run for a minimum period") {
+ // repeat the test a few times to avoid random flakes
+ for (_ <- 1 to 10) {
+ val st = new SleepTimeTracker()
+ val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE), numFails = 100)
+ val retryHandler = new GrpcRetryHandler(RetryPolicy.defaultPolicies(), st.sleep)
+
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry {
+ dummyFn.fn()
+ }
+ }
+
+ assert(st.totalSleep >= 10 * 60 * 1000) // waited at least 10 minutes
+ }
+ }
+
+ test("SPARK-44275: retry actually retries") {
+ val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE))
+ val retryPolicies = RetryPolicy.defaultPolicies()
+ val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = _ => {})
+ val result = retryHandler.retry { dummyFn.fn() }
+
+ assert(result == 42)
+ assert(dummyFn.counter == 3)
+ }
+
+ test("SPARK-44275: default retryException retries only on UNAVAILABLE") {
+ val dummyFn = new DummyFn(new StatusRuntimeException(Status.ABORTED))
+ val retryPolicies = RetryPolicy.defaultPolicies()
+ val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = _ => {})
+
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry { dummyFn.fn() }
+ }
+ assert(dummyFn.counter == 1)
+ }
+
+ test("SPARK-44275: retry uses canRetry to filter exceptions") {
+ val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE))
+ val retryPolicy = RetryPolicy(canRetry = _ => false, name = "TestPolicy")
+ val retryHandler = new GrpcRetryHandler(retryPolicy)
+
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry { dummyFn.fn() }
+ }
+ assert(dummyFn.counter == 1)
+ }
+
+ test("SPARK-44275: retry does not exceed maxRetries") {
+ val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE))
+ val retryPolicy = RetryPolicy(canRetry = _ => true, maxRetries = Some(1), name = "TestPolicy")
+ val retryHandler = new GrpcRetryHandler(retryPolicy, sleep = _ => {})
+
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry { dummyFn.fn() }
+ }
+ assert(dummyFn.counter == 2)
+ }
+
+ def testPolicySpecificError(maxRetries: Int, status: Status): RetryPolicy = {
+ RetryPolicy(
+ maxRetries = Some(maxRetries),
+ name = s"Policy for ${status.getCode}",
+ canRetry = {
+ case e: StatusRuntimeException => e.getStatus.getCode == status.getCode
+ case _ => false
+ })
+ }
+
+ test("Test multiple policies") {
+ val policy1 = testPolicySpecificError(maxRetries = 2, status = Status.UNAVAILABLE)
+ val policy2 = testPolicySpecificError(maxRetries = 4, status = Status.INTERNAL)
+
+ // Tolerate 2 UNAVAILABLE errors and 4 INTERNAL errors
+
+ val errors = (List.fill(2)(Status.UNAVAILABLE) ++ List.fill(4)(Status.INTERNAL)).iterator
+
+ new GrpcRetryHandler(List(policy1, policy2), sleep = _ => {}).retry({
+ val e = errors.nextOption()
+ if (e.isDefined) {
+ throw e.get.asRuntimeException()
+ }
+ })
+
+ assert(!errors.hasNext)
+ }
+
+ test("Test multiple policies exceed") {
+ val policy1 = testPolicySpecificError(maxRetries = 2, status = Status.INTERNAL)
+ val policy2 = testPolicySpecificError(maxRetries = 4, status = Status.INTERNAL)
+
+ val errors = List.fill(10)(Status.INTERNAL).iterator
+ var countAttempted = 0
+
+ assertThrows[StatusRuntimeException](
+ new GrpcRetryHandler(List(policy1, policy2), sleep = _ => {}).retry({
+ countAttempted += 1
+ val e = errors.nextOption()
+ if (e.isDefined) {
+ throw e.get.asRuntimeException()
+ }
+ }))
+
+ assert(countAttempted == 3)
+ }
+
+ test("DefaultPolicy retries exceptions with RetryInfo") {
+ // Error contains RetryInfo with retry_delay set to 0
+ val dummyFn =
+ new DummyFn(createTestExceptionWithDetails(msg = "Some error message"), numFails = 100)
+ val retryPolicies = RetryPolicy.defaultPolicies()
+ val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = _ => {})
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry { dummyFn.fn() }
+ }
+
+ // Should be retried by DefaultPolicy
+ val policy = retryPolicies.find(_.name == "DefaultPolicy").get
+ assert(dummyFn.counter == policy.maxRetries.get + 1)
+ }
+
+ test("retry_delay overrides maxBackoff") {
+ val st = new SleepTimeTracker()
+ val retryDelay = FiniteDuration(5, "min")
+ val dummyFn = new DummyFn(
+ createTestExceptionWithDetails(msg = "Some error message", retryDelay = retryDelay),
+ numFails = 100)
+ val retryPolicies = RetryPolicy.defaultPolicies()
+ val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = st.sleep)
+
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry { dummyFn.fn() }
+ }
+
+ // Should be retried by DefaultPolicy
+ val policy = retryPolicies.find(_.name == "DefaultPolicy").get
+ // sleep times are higher than maxBackoff and are equal to retryDelay + jitter
+ st.times.foreach(t => assert(t > policy.maxBackoff.get.toMillis + policy.jitter.toMillis))
+ val expectedSleeps = List.fill(policy.maxRetries.get)(retryDelay.toMillis)
+ assertLongSequencesAlmostEqual(st.times, expectedSleeps, policy.jitter.toMillis)
+ }
+
+ test("maxServerRetryDelay limits retry_delay") {
+ val st = new SleepTimeTracker()
+ val retryDelay = FiniteDuration(5, "d")
+ val dummyFn = new DummyFn(
+ createTestExceptionWithDetails(msg = "Some error message", retryDelay = retryDelay),
+ numFails = 100)
+ val retryPolicies = RetryPolicy.defaultPolicies()
+ val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = st.sleep)
+
+ assertThrows[StatusRuntimeException] {
+ retryHandler.retry { dummyFn.fn() }
+ }
+
+ // Should be retried by DefaultPolicy
+ val policy = retryPolicies.find(_.name == "DefaultPolicy").get
+ val expectedSleeps = List.fill(policy.maxRetries.get)(policy.maxServerRetryDelay.get.toMillis)
+ assertLongSequencesAlmostEqual(st.times, expectedSleeps, policy.jitter.toMillis)
+ }
+
+ test("Policy uses to exponential backoff after retry_delay is unset") {
+ val st = new SleepTimeTracker()
+ val retryDelay = FiniteDuration(5, "min")
+ val retryPolicies = RetryPolicy.defaultPolicies()
+ val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = st.sleep)
+ val errors = (
+ List.fill(2)(
+ createTestExceptionWithDetails(
+ msg = "Some error message",
+ retryDelay = retryDelay)) ++ List.fill(3)(
+ createTestExceptionWithDetails(
+ msg = "Some error message",
+ code = Status.Code.UNAVAILABLE))
+ ).iterator
+
+ retryHandler.retry({
+ if (errors.hasNext) {
+ throw errors.next()
+ }
+ })
+ assert(!errors.hasNext)
+
+ // Should be retried by DefaultPolicy
+ val policy = retryPolicies.find(_.name == "DefaultPolicy").get
+ val expectedSleeps = List.fill(2)(retryDelay.toMillis) ++ List.tabulate(3)(i =>
+ policy.initialBackoff.toMillis * math.pow(policy.backoffMultiplier, i + 2).toLong)
+ assertLongSequencesAlmostEqual(st.times, expectedSleeps, delta = policy.jitter.toMillis)
+ }
+}
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientSuite.scala
index 9bb8f5889d330..a41ea344cbd4c 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/SparkConnectClientSuite.scala
@@ -339,130 +339,6 @@ class SparkConnectClientSuite extends ConnectFunSuite with BeforeAndAfterEach {
}
}
- private class DummyFn(e: => Throwable, numFails: Int = 3) {
- var counter = 0
- def fn(): Int = {
- if (counter < numFails) {
- counter += 1
- throw e
- } else {
- 42
- }
- }
- }
-
- test("SPARK-44721: Retries run for a minimum period") {
- // repeat test few times to avoid random flakes
- for (_ <- 1 to 10) {
- var totalSleepMs: Long = 0
-
- def sleep(t: Long): Unit = {
- totalSleepMs += t
- }
-
- val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE), numFails = 100)
- val retryHandler = new GrpcRetryHandler(RetryPolicy.defaultPolicies(), sleep)
-
- assertThrows[RetriesExceeded] {
- retryHandler.retry {
- dummyFn.fn()
- }
- }
-
- assert(totalSleepMs >= 10 * 60 * 1000) // waited at least 10 minutes
- }
- }
-
- test("SPARK-44275: retry actually retries") {
- val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE))
- val retryPolicies = RetryPolicy.defaultPolicies()
- val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = _ => {})
- val result = retryHandler.retry { dummyFn.fn() }
-
- assert(result == 42)
- assert(dummyFn.counter == 3)
- }
-
- test("SPARK-44275: default retryException retries only on UNAVAILABLE") {
- val dummyFn = new DummyFn(new StatusRuntimeException(Status.ABORTED))
- val retryPolicies = RetryPolicy.defaultPolicies()
- val retryHandler = new GrpcRetryHandler(retryPolicies, sleep = _ => {})
-
- assertThrows[StatusRuntimeException] {
- retryHandler.retry { dummyFn.fn() }
- }
- assert(dummyFn.counter == 1)
- }
-
- test("SPARK-44275: retry uses canRetry to filter exceptions") {
- val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE))
- val retryPolicy = RetryPolicy(canRetry = _ => false, name = "TestPolicy")
- val retryHandler = new GrpcRetryHandler(retryPolicy)
-
- assertThrows[StatusRuntimeException] {
- retryHandler.retry { dummyFn.fn() }
- }
- assert(dummyFn.counter == 1)
- }
-
- test("SPARK-44275: retry does not exceed maxRetries") {
- val dummyFn = new DummyFn(new StatusRuntimeException(Status.UNAVAILABLE))
- val retryPolicy = RetryPolicy(canRetry = _ => true, maxRetries = Some(1), name = "TestPolicy")
- val retryHandler = new GrpcRetryHandler(retryPolicy, sleep = _ => {})
-
- assertThrows[RetriesExceeded] {
- retryHandler.retry { dummyFn.fn() }
- }
- assert(dummyFn.counter == 2)
- }
-
- def testPolicySpecificError(maxRetries: Int, status: Status): RetryPolicy = {
- RetryPolicy(
- maxRetries = Some(maxRetries),
- name = s"Policy for ${status.getCode}",
- canRetry = {
- case e: StatusRuntimeException => e.getStatus.getCode == status.getCode
- case _ => false
- })
- }
-
- test("Test multiple policies") {
- val policy1 = testPolicySpecificError(maxRetries = 2, status = Status.UNAVAILABLE)
- val policy2 = testPolicySpecificError(maxRetries = 4, status = Status.INTERNAL)
-
- // Tolerate 2 UNAVAILABLE errors and 4 INTERNAL errors
-
- val errors = (List.fill(2)(Status.UNAVAILABLE) ++ List.fill(4)(Status.INTERNAL)).iterator
-
- new GrpcRetryHandler(List(policy1, policy2), sleep = _ => {}).retry({
- val e = errors.nextOption()
- if (e.isDefined) {
- throw e.get.asRuntimeException()
- }
- })
-
- assert(!errors.hasNext)
- }
-
- test("Test multiple policies exceed") {
- val policy1 = testPolicySpecificError(maxRetries = 2, status = Status.INTERNAL)
- val policy2 = testPolicySpecificError(maxRetries = 4, status = Status.INTERNAL)
-
- val errors = List.fill(10)(Status.INTERNAL).iterator
- var countAttempted = 0
-
- assertThrows[RetriesExceeded](
- new GrpcRetryHandler(List(policy1, policy2), sleep = _ => {}).retry({
- countAttempted += 1
- val e = errors.nextOption()
- if (e.isDefined) {
- throw e.get.asRuntimeException()
- }
- }))
-
- assert(countAttempted == 7)
- }
-
test("ArtifactManager retries errors") {
var attempt = 0
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/arrow/ArrowEncoderSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/arrow/ArrowEncoderSuite.scala
index 75816a835aaa7..b29d73be359b5 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/arrow/ArrowEncoderSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/client/arrow/ArrowEncoderSuite.scala
@@ -36,7 +36,7 @@ import org.apache.spark.sql.catalyst.{DefinedByConstructorParams, JavaTypeInfere
import org.apache.spark.sql.catalyst.encoders.{AgnosticEncoder, Codec, OuterScopes}
import org.apache.spark.sql.catalyst.encoders.AgnosticEncoders.{agnosticEncoderFor, BinaryEncoder, BoxedBooleanEncoder, BoxedByteEncoder, BoxedDoubleEncoder, BoxedFloatEncoder, BoxedIntEncoder, BoxedLongEncoder, BoxedShortEncoder, CalendarIntervalEncoder, DateEncoder, DayTimeIntervalEncoder, EncoderField, InstantEncoder, IterableEncoder, JavaDecimalEncoder, LocalDateEncoder, LocalDateTimeEncoder, NullEncoder, PrimitiveBooleanEncoder, PrimitiveByteEncoder, PrimitiveDoubleEncoder, PrimitiveFloatEncoder, PrimitiveIntEncoder, PrimitiveLongEncoder, PrimitiveShortEncoder, RowEncoder, ScalaDecimalEncoder, StringEncoder, TimestampEncoder, TransformingEncoder, UDTEncoder, YearMonthIntervalEncoder}
import org.apache.spark.sql.catalyst.encoders.RowEncoder.{encoderFor => toRowEncoder}
-import org.apache.spark.sql.catalyst.util.{DateFormatter, SparkStringUtils, TimestampFormatter}
+import org.apache.spark.sql.catalyst.util.{DateFormatter, TimestampFormatter}
import org.apache.spark.sql.catalyst.util.DateTimeConstants.MICROS_PER_SECOND
import org.apache.spark.sql.catalyst.util.IntervalStringStyles.ANSI_STYLE
import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils._
@@ -46,6 +46,7 @@ import org.apache.spark.sql.connect.client.arrow.FooEnum.FooEnum
import org.apache.spark.sql.connect.test.ConnectFunSuite
import org.apache.spark.sql.types.{ArrayType, DataType, DayTimeIntervalType, Decimal, DecimalType, IntegerType, Metadata, SQLUserDefinedType, StringType, StructType, UserDefinedType, YearMonthIntervalType}
import org.apache.spark.unsafe.types.VariantVal
+import org.apache.spark.util.SparkStringUtils
/**
* Tests for encoding external data to and from arrow.
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/streaming/TransformWithStateConnectSuite.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/streaming/TransformWithStateConnectSuite.scala
index 310b50dac1cc3..359486ae8e652 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/streaming/TransformWithStateConnectSuite.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/streaming/TransformWithStateConnectSuite.scala
@@ -26,17 +26,22 @@ import org.scalatest.concurrent.Eventually.eventually
import org.scalatest.concurrent.Futures.timeout
import org.scalatest.time.SpanSugar._
+import org.apache.spark.SparkUnsupportedOperationException
import org.apache.spark.internal.Logging
import org.apache.spark.sql.{DataFrame, Dataset, Encoders, Row}
import org.apache.spark.sql.connect.SparkSession
import org.apache.spark.sql.connect.test.{QueryTest, RemoteSparkSession}
import org.apache.spark.sql.functions._
-import org.apache.spark.sql.streaming.{ListState, MapState, OutputMode, StatefulProcessor, StatefulProcessorWithInitialState, TimeMode, TimerValues, TTLConfig, ValueState}
+import org.apache.spark.sql.streaming.{ListState, MapState, OutputMode, StatefulProcessor, StatefulProcessorWithInitialState, StreamingQueryException, TimeMode, TimerValues, TTLConfig, ValueState}
import org.apache.spark.sql.types._
+import org.apache.spark.util.SparkFileUtils
case class InputRowForConnectTest(key: String, value: String)
case class OutputRowForConnectTest(key: String, value: String)
+case class StateRowForConnectTestWithIntType(count: Int)
case class StateRowForConnectTest(count: Long)
+case class StateRowForConnectTestWithTwoLongs(count: Long, count2: Long)
+case class StateRowForConnectTestWithReorder(count2: Long, count: Long)
// A basic stateful processor which will return the occurrences of key
class BasicCountStatefulProcessor
@@ -67,6 +72,97 @@ class BasicCountStatefulProcessor
}
}
+// A basic stateful processor which returns the occurrences of each key.
+// The count state is an Int type.
+class CountStatefulProcessorWithInt
+ extends StatefulProcessor[String, InputRowForConnectTest, OutputRowForConnectTest]
+ with Logging {
+ @transient protected var _countState: ValueState[StateRowForConnectTestWithIntType] = _
+
+ override def init(outputMode: OutputMode, timeMode: TimeMode): Unit = {
+ _countState = getHandle.getValueState[StateRowForConnectTestWithIntType](
+ "countState",
+ Encoders.product[StateRowForConnectTestWithIntType],
+ TTLConfig.NONE)
+ }
+
+ override def handleInputRows(
+ key: String,
+ inputRows: Iterator[InputRowForConnectTest],
+ timerValues: TimerValues): Iterator[OutputRowForConnectTest] = {
+ val count = inputRows.toSeq.length + {
+ if (_countState.exists()) {
+ _countState.get().count
+ } else {
+ 0
+ }
+ }
+ _countState.update(StateRowForConnectTestWithIntType(count))
+ Iterator(OutputRowForConnectTest(key, count.toString))
+ }
+}
+
+// A stateful processor with two Longs as state,
+// which returns the occurrences of each key, to test TWS schema evolution
+class CountStatefulProcessorTwoLongs
+ extends StatefulProcessor[String, InputRowForConnectTest, OutputRowForConnectTest]
+ with Logging {
+ @transient protected var _countState: ValueState[StateRowForConnectTestWithTwoLongs] = _
+
+ override def init(outputMode: OutputMode, timeMode: TimeMode): Unit = {
+ _countState = getHandle.getValueState[StateRowForConnectTestWithTwoLongs](
+ "countState",
+ Encoders.product[StateRowForConnectTestWithTwoLongs],
+ TTLConfig.NONE)
+ }
+
+ override def handleInputRows(
+ key: String,
+ inputRows: Iterator[InputRowForConnectTest],
+ timerValues: TimerValues): Iterator[OutputRowForConnectTest] = {
+ val count = inputRows.toSeq.length + {
+ if (_countState.exists()) {
+ _countState.get().count
+ } else {
+ 0L
+ }
+ }
+ _countState.update(StateRowForConnectTestWithTwoLongs(count, count))
+ Iterator(OutputRowForConnectTest(key, count.toString))
+ }
+}
+
+// A stateful processor with two Longs as state, using StateRowForConnectTestWithReorder,
+// which reorders the fields of StateRowForConnectTestWithTwoLongs. It returns the
+// occurrences of each key to test TWS schema evolution.
+class CountStatefulProcessorWithReorder
+ extends StatefulProcessor[String, InputRowForConnectTest, OutputRowForConnectTest]
+ with Logging {
+ @transient protected var _countState: ValueState[StateRowForConnectTestWithReorder] = _
+
+ override def init(outputMode: OutputMode, timeMode: TimeMode): Unit = {
+ _countState = getHandle.getValueState[StateRowForConnectTestWithReorder](
+ "countState",
+ Encoders.product[StateRowForConnectTestWithReorder],
+ TTLConfig.NONE)
+ }
+
+ override def handleInputRows(
+ key: String,
+ inputRows: Iterator[InputRowForConnectTest],
+ timerValues: TimerValues): Iterator[OutputRowForConnectTest] = {
+ val count = inputRows.toSeq.length + {
+ if (_countState.exists()) {
+ _countState.get().count
+ } else {
+ 0L
+ }
+ }
+ _countState.update(StateRowForConnectTestWithReorder(count, count))
+ Iterator(OutputRowForConnectTest(key, count.toString))
+ }
+}
+
// A stateful processor with initial state which will return the occurrences of key
class TestInitialStatefulProcessor
extends StatefulProcessorWithInitialState[
@@ -488,13 +584,140 @@ class TransformWithStateConnectSuite
}
}
+ private def runSchemaEvolutionTest(
+ firstProcessor: StatefulProcessor[String, InputRowForConnectTest, OutputRowForConnectTest],
+ secondProcessor: StatefulProcessor[String, InputRowForConnectTest, OutputRowForConnectTest])
+ : Unit = {
+ withSQLConf(
+ (twsAdditionalSQLConf ++
+ Seq("spark.sql.streaming.stateStore.encodingFormat" -> "avro")): _*) {
+ val session: SparkSession = spark
+ import session.implicits._
+
+ withTempPath { dir =>
+ val path = dir.getCanonicalPath
+ val checkpointPath = s"$path/cpt"
+ val dataPath = s"$path/data"
+ val targetPath = s"$path/tgt"
+
+ testData
+ .toDS()
+ .toDF("key", "value")
+ .repartition(3)
+ .write
+ .mode("append")
+ .parquet(dataPath)
+
+ val testSchema =
+ StructType(Array(StructField("key", StringType), StructField("value", StringType)))
+
+ val q1 = spark.readStream
+ .schema(testSchema)
+ .option("maxFilesPerTrigger", 1)
+ .parquet(dataPath)
+ .as[InputRowForConnectTest]
+ .groupByKey(x => x.key)
+ .transformWithState[OutputRowForConnectTest](
+ firstProcessor,
+ TimeMode.None(),
+ OutputMode.Update())
+ .writeStream
+ .format("parquet")
+ .option("checkpointLocation", checkpointPath)
+ .option("path", targetPath)
+ .start()
+
+ try {
+ q1.processAllAvailable()
+ eventually(timeout(30.seconds)) {
+ checkDatasetUnorderly(
+ spark.read.format("parquet").load(targetPath).as[(String, String)],
+ ("a", "1"),
+ ("a", "2"),
+ ("b", "1"))
+ }
+ } finally {
+ q1.stop()
+ }
+
+ testData
+ .toDS()
+ .toDF("key", "value")
+ .repartition(3)
+ .write
+ .mode("append")
+ .parquet(dataPath)
+
+ val q2 = spark.readStream
+ .schema(testSchema)
+ .option("maxFilesPerTrigger", 1)
+ .parquet(dataPath)
+ .as[InputRowForConnectTest]
+ .groupByKey(x => x.key)
+ .transformWithState[OutputRowForConnectTest](
+ secondProcessor,
+ TimeMode.None(),
+ OutputMode.Update())
+ .writeStream
+ .format("parquet")
+ .option("checkpointLocation", checkpointPath)
+ .option("path", targetPath)
+ .start()
+
+ try {
+ q2.processAllAvailable()
+ eventually(timeout(30.seconds)) {
+ checkDatasetUnorderly(
+ spark.read.format("parquet").load(targetPath).as[(String, String)],
+ ("a", "1"),
+ ("a", "2"),
+ ("b", "1"),
+ ("a", "3"),
+ ("a", "4"),
+ ("b", "2"))
+ }
+ } finally {
+ q2.stop()
+ }
+ }
+ }
+ }
+
+ test("transformWithState - add fields schema evolution") {
+ runSchemaEvolutionTest(new BasicCountStatefulProcessor, new CountStatefulProcessorTwoLongs)
+ }
+
+ test("transformWithState - remove fields schema evolution") {
+ runSchemaEvolutionTest(new CountStatefulProcessorTwoLongs, new BasicCountStatefulProcessor)
+ }
+
+ test("transformWithState - reorder fields schema evolution") {
+ runSchemaEvolutionTest(
+ new CountStatefulProcessorTwoLongs,
+ new CountStatefulProcessorWithReorder)
+ }
+
+ test("transformWithState - upcast fields schema evolution") {
+ runSchemaEvolutionTest(new CountStatefulProcessorWithInt, new BasicCountStatefulProcessor)
+ }
+
+ test("transformWithState - downcast fields would fail") {
+ val e = intercept[StreamingQueryException] {
+ runSchemaEvolutionTest(new BasicCountStatefulProcessor, new CountStatefulProcessorWithInt)
+ }
+ assert(
+ e.getCause
+ .asInstanceOf[SparkUnsupportedOperationException]
+ .getCondition == "STATE_STORE_INVALID_VALUE_SCHEMA_EVOLUTION")
+ }
+
/* Utils functions for tests */
def prepareInputData(inputPath: String, col1: Seq[String], col2: Seq[Int]): File = {
// Ensure the parent directory exists
val file = Paths.get(inputPath).toFile
val parentDir = file.getParentFile
if (parentDir != null && !parentDir.exists()) {
- parentDir.mkdirs()
+ SparkFileUtils.createDirectory(parentDir)
}
val writer = new BufferedWriter(new FileWriter(inputPath))
diff --git a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/test/QueryTest.scala b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/test/QueryTest.scala
index 5ae23368b9729..da3b32b408f58 100644
--- a/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/test/QueryTest.scala
+++ b/sql/connect/client/jvm/src/test/scala/org/apache/spark/sql/connect/test/QueryTest.scala
@@ -25,9 +25,9 @@ import org.scalatest.Assertions
import org.apache.spark.{QueryContextType, SparkThrowable}
import org.apache.spark.sql.Row
-import org.apache.spark.sql.catalyst.util.SparkStringUtils.sideBySide
import org.apache.spark.sql.connect.{DataFrame, Dataset, SparkSession}
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.SparkStringUtils.sideBySide
abstract class QueryTest extends ConnectFunSuite with SQLHelper {
diff --git a/sql/connect/common/pom.xml b/sql/connect/common/pom.xml
index 18fb06ff3341d..6ff47ec6d68ce 100644
--- a/sql/connect/common/pom.xml
+++ b/sql/connect/common/pom.xml
@@ -105,13 +105,6 @@
- <extensions>
- <extension>
- <groupId>kr.motd.maven</groupId>
- <artifactId>os-maven-plugin</artifactId>
- <version>1.6.2</version>
- </extension>
- </extensions>
<outputDirectory>target/scala-${scala.binary.version}/classes</outputDirectory>
<testOutputDirectory>target/scala-${scala.binary.version}/test-classes</testOutputDirectory>
diff --git a/sql/connect/common/src/main/protobuf/spark/connect/expressions.proto b/sql/connect/common/src/main/protobuf/spark/connect/expressions.proto
index df907a84868fe..913622b91a284 100644
--- a/sql/connect/common/src/main/protobuf/spark/connect/expressions.proto
+++ b/sql/connect/common/src/main/protobuf/spark/connect/expressions.proto
@@ -195,6 +195,7 @@ message Expression {
Struct struct = 24;
SpecializedArray specialized_array = 25;
+ Time time = 26;
}
message Decimal {
@@ -214,20 +215,66 @@ message Expression {
}
message Array {
- DataType element_type = 1;
+ // (Deprecated) The element type of the array.
+ //
+ // This field is deprecated since Spark 4.1+ and should only be set
+ // if the data_type field is not set. Use data_type field instead.
+ DataType element_type = 1 [deprecated = true];
+
+ // The literal values that make up the array elements.
repeated Literal elements = 2;
+
+ // The type of the array.
+ //
+ // If the element type can be inferred from the first element of the elements field,
+ // then you don't need to set data_type.element_type to save space. On the other hand,
+ // redundant type information is also acceptable.
+ DataType.Array data_type = 3;
}
message Map {
- DataType key_type = 1;
- DataType value_type = 2;
+ // (Deprecated) The key type of the map.
+ //
+ // This field is deprecated since Spark 4.1+ and should only be set
+ // if the data_type field is not set. Use data_type field instead.
+ DataType key_type = 1 [deprecated = true];
+
+ // (Deprecated) The value type of the map.
+ //
+ // This field is deprecated since Spark 4.1+ and should only be set
+ // if the data_type field is not set. Use data_type field instead.
+ DataType value_type = 2 [deprecated = true];
+
+ // The literal keys that make up the map.
repeated Literal keys = 3;
+
+ // The literal values that make up the map.
repeated Literal values = 4;
+
+ // The type of the map.
+ //
+ // If the key/value types can be inferred from the first element of the keys/values fields,
+ // then you don't need to set data_type.key_type/data_type.value_type to save space.
+ // On the other hand, redundant type information is also acceptable.
+ DataType.Map data_type = 5;
}
message Struct {
- DataType struct_type = 1;
+ // (Deprecated) The type of the struct.
+ //
+ // This field is deprecated since Spark 4.1+ because using DataType as the type of a struct
+ // is ambiguous. This field should only be set if the data_type_struct field is not set.
+ // Use data_type_struct field instead.
+ DataType struct_type = 1 [deprecated = true];
+
+ // (Required) The literal values that make up the struct elements.
repeated Literal elements = 2;
+
+ // The type of the struct.
+ //
+ // Whether data_type_struct.fields.data_type should be set depends on
+ // whether each field's type can be inferred from the elements field.
+ DataType.Struct data_type_struct = 3;
}
message SpecializedArray {
@@ -240,6 +287,12 @@ message Expression {
Strings strings = 6;
}
}
+
+ message Time {
+ int64 nano = 1;
+ // The precision of this time. If omitted, the default value MICROS_PRECISION is used.
+ optional int32 precision = 2;
+ }
}
// An unresolved attribute that is not explicitly bound to a specific column, but the column
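Aside (not part of the patch): a minimal sketch, in Scala, of how a client can populate the new data_type field on an array literal instead of the deprecated element_type. The builder calls mirror the LiteralValueProtoConverter changes later in this diff; treating toConnectProtoType as the public helper on DataTypeProtoConverter is an assumption.

import org.apache.spark.connect.proto
import org.apache.spark.sql.connect.common.DataTypeProtoConverter.toConnectProtoType
import org.apache.spark.sql.types.StringType

// Sketch only: build Expression.Literal.Array carrying DataType.Array in the new
// data_type field rather than the deprecated element_type field.
val literalBuilder = proto.Expression.Literal.newBuilder()
val arrayBuilder = literalBuilder.getArrayBuilder
arrayBuilder.setDataType(
  proto.DataType.Array
    .newBuilder()
    .setElementType(toConnectProtoType(StringType))
    .setContainsNull(false)
    .build())
Seq("a", "b").foreach { value =>
  arrayBuilder.addElements(proto.Expression.Literal.newBuilder().setString(value))
}
val arrayLiteral = literalBuilder.build()

Since the element type is inferable from the first element here, setting data_type.element_type is optional; the redundant form above is also accepted.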
diff --git a/sql/connect/common/src/main/protobuf/spark/connect/ml.proto b/sql/connect/common/src/main/protobuf/spark/connect/ml.proto
index b66c0a186df39..ef5c406dedd26 100644
--- a/sql/connect/common/src/main/protobuf/spark/connect/ml.proto
+++ b/sql/connect/common/src/main/protobuf/spark/connect/ml.proto
@@ -38,6 +38,8 @@ message MlCommand {
Evaluate evaluate = 6;
CleanCache clean_cache = 7;
GetCacheInfo get_cache_info = 8;
+ CreateSummary create_summary = 9;
+ GetModelSize get_model_size = 10;
}
// Command for estimator.fit(dataset)
@@ -54,6 +56,9 @@ message MlCommand {
// or summary evaluated by a model
message Delete {
repeated ObjectRef obj_refs = 1;
+ // If `evict_only` is set to true, only evict the cached model from memory,
+ // but keep the offloaded model on the Spark driver's local disk.
+ optional bool evict_only = 2;
}
// Force to clean up all the ML cached objects
@@ -98,6 +103,18 @@ message MlCommand {
// (Required) the evaluating dataset
Relation dataset = 3;
}
+
+ // This is for re-creating the model summary when it is lost
+ // (the model summary is lost when the model is offloaded and then loaded back).
+ message CreateSummary {
+ ObjectRef model_ref = 1;
+ Relation dataset = 2;
+ }
+
+ // This is for querying the model's estimated in-memory size
+ message GetModelSize {
+ ObjectRef model_ref = 1;
+ }
}
// The result of MlCommand
diff --git a/sql/connect/common/src/main/protobuf/spark/connect/pipelines.proto b/sql/connect/common/src/main/protobuf/spark/connect/pipelines.proto
index 2f685c6da42c9..57e1ffc7dbe76 100644
--- a/sql/connect/common/src/main/protobuf/spark/connect/pipelines.proto
+++ b/sql/connect/common/src/main/protobuf/spark/connect/pipelines.proto
@@ -25,6 +25,7 @@ import "spark/connect/types.proto";
option java_multiple_files = true;
option java_package = "org.apache.spark.connect.proto";
+option go_package = "internal/generated";
// Dispatch object for pipelines commands. See each individual command for documentation.
message PipelineCommand {
@@ -101,13 +102,10 @@ message PipelineCommand {
optional string target_dataset_name = 3;
// An unresolved relation that defines the dataset's flow.
- optional spark.connect.Relation plan = 4;
+ optional spark.connect.Relation relation = 4;
// SQL configurations set when running this flow.
map<string, string> sql_conf = 5;
-
- // If true, this flow will only be run once per full refresh.
- optional bool once = 6;
}
// Resolves all datasets and flows and start a pipeline update. Should be called after all
@@ -115,6 +113,19 @@ message PipelineCommand {
message StartRun {
// The graph to start.
optional string dataflow_graph_id = 1;
+
+ // List of datasets to reset and recompute.
+ repeated string full_refresh_selection = 2;
+
+ // Perform a full graph reset and recompute.
+ optional bool full_refresh_all = 3;
+
+ // List of datasets to update.
+ repeated string refresh_selection = 4;
+
+ // If true, the run will not actually execute any flows, but will only validate the graph and
+ // check for any errors. This is useful for testing and validation purposes.
+ optional bool dry = 5;
}
// Parses the SQL file and registers all datasets and flows.
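Aside (not part of the patch): a hedged sketch of the new StartRun options through the generated builders; the method names follow standard protobuf Java codegen for the fields above, and the graph id and dataset name are placeholders.

import org.apache.spark.connect.proto

// Dry run: resolve and validate the graph, report errors, but execute no flows.
val dryRun = proto.PipelineCommand.StartRun
  .newBuilder()
  .setDataflowGraphId("graph-id-placeholder") // hypothetical graph id
  .addRefreshSelection("example_dataset")     // hypothetical dataset to update
  .setDry(true)
  .build()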
diff --git a/sql/connect/common/src/main/protobuf/spark/connect/relations.proto b/sql/connect/common/src/main/protobuf/spark/connect/relations.proto
index 70a52a2111494..ccb674e812dc0 100644
--- a/sql/connect/common/src/main/protobuf/spark/connect/relations.proto
+++ b/sql/connect/common/src/main/protobuf/spark/connect/relations.proto
@@ -115,6 +115,9 @@ message MlRelation {
Transform transform = 1;
Fetch fetch = 2;
}
+ // (Optional) the dataset for restoring the model summary
+ optional Relation model_summary_dataset = 3;
+
// Relation to represent transform(input) of the operator
// which could be a cached model or a new transformer
message Transform {
diff --git a/sql/connect/common/src/main/protobuf/spark/connect/types.proto b/sql/connect/common/src/main/protobuf/spark/connect/types.proto
index e1a111e5d6917..1800e3885774f 100644
--- a/sql/connect/common/src/main/protobuf/spark/connect/types.proto
+++ b/sql/connect/common/src/main/protobuf/spark/connect/types.proto
@@ -69,8 +69,13 @@ message DataType {
// UnparsedDataType
Unparsed unparsed = 24;
+
+ Time time = 28;
}
+ // Reserved for geometry and geography types
+ reserved 26, 27;
+
message Boolean {
uint32 type_variation_reference = 1;
}
@@ -124,6 +129,11 @@ message DataType {
uint32 type_variation_reference = 1;
}
+ message Time {
+ optional int32 precision = 1;
+ uint32 type_variation_reference = 2;
+ }
+
message CalendarInterval {
uint32 type_variation_reference = 1;
}
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/DataFrameReader.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/DataFrameReader.scala
index 0af603e0f6cc9..67a4d983f56bf 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/DataFrameReader.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/DataFrameReader.scala
@@ -79,8 +79,7 @@ class DataFrameReader private[sql] (sparkSession: SparkSession) extends sql.Data
def load(paths: String*): DataFrame = {
sparkSession.newDataFrame { builder =>
val dataSourceBuilder = builder.getReadBuilder.getDataSourceBuilder
- assertSourceFormatSpecified()
- dataSourceBuilder.setFormat(source)
+ Option(source).foreach(dataSourceBuilder.setFormat)
userSpecifiedSchema.foreach(schema => dataSourceBuilder.setSchema(schema.toDDL))
extraOptions.foreach { case (k, v) =>
dataSourceBuilder.putOptions(k, v)
@@ -211,12 +210,6 @@ class DataFrameReader private[sql] (sparkSession: SparkSession) extends sql.Data
@scala.annotation.varargs
override def textFile(paths: String*): Dataset[String] = super.textFile(paths: _*)
- private def assertSourceFormatSpecified(): Unit = {
- if (source == null) {
- throw new IllegalArgumentException("The source format must be specified.")
- }
- }
-
private def parse(ds: Dataset[String], format: ParseFormat): DataFrame = {
sparkSession.newDataFrame { builder =>
val parseBuilder = builder.getParseBuilder
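Aside (not part of the patch): with the source-format assertion removed, format() becomes optional on the Connect DataFrameReader. A brief usage sketch follows; that the server falls back to its default data source when the format field is unset is an assumption, not something this diff states.

// `spark` is assumed to be a connected SparkSession.
// Explicit format still works exactly as before.
val csv = spark.read.format("csv").option("header", "true").load("/tmp/input.csv")

// Without .format(...), the proto's format field is simply left unset and
// resolution is deferred to the server.
val df = spark.read.load("/tmp/input")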
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/KeyValueGroupedDataset.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/KeyValueGroupedDataset.scala
index af036218455fa..49298a5b39fc6 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/KeyValueGroupedDataset.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/KeyValueGroupedDataset.scala
@@ -24,6 +24,7 @@ import org.apache.spark.api.java.function._
import org.apache.spark.connect.proto
import org.apache.spark.sql
import org.apache.spark.sql.{Column, Encoder, TypedColumn}
+import org.apache.spark.sql.catalyst.ScalaReflection
import org.apache.spark.sql.catalyst.encoders.AgnosticEncoder
import org.apache.spark.sql.catalyst.encoders.AgnosticEncoders.{agnosticEncoderFor, ProductEncoder, StructEncoder}
import org.apache.spark.sql.connect.ColumnNodeToProtoConverter.{toExpr, toExprWithTransformation, toTypedExpr}
@@ -658,8 +659,14 @@ private class KeyValueGroupedDatasetImpl[K, V, IK, IV](
initialState: Option[sql.KeyValueGroupedDataset[K, S]] = None,
eventTimeColumnName: String = ""): Dataset[U] = {
val outputEncoder = agnosticEncoderFor[U]
- val stateEncoder = agnosticEncoderFor[S]
- val inputEncoders: Seq[AgnosticEncoder[_]] = Seq(kEncoder, stateEncoder, ivEncoder)
+ val initialStateEncoder = if (initialState.isDefined) {
+ agnosticEncoderFor[S]
+ } else {
+ // Cannot use `agnosticEncoderFor[S]` here because it resolves to an incorrect encoder
+ // when the initial state is not provided. Use an empty state encoder instead.
+ ScalaReflection.encoderFor[EmptyInitialStateStruct]
+ }
+ val inputEncoders: Seq[AgnosticEncoder[_]] = Seq(kEncoder, initialStateEncoder, ivEncoder)
// SparkUserDefinedFunction is creating a udfPacket where the input function are
// being java serialized into bytes; we pass in `statefulProcessor` as function so it can be
@@ -780,3 +787,14 @@ private object KeyValueGroupedDatasetImpl {
case _ => false
}
}
+
+/**
+ * A marker case class used as a placeholder type for initial state encoders when no actual
+ * initial state is provided to stateful streaming operations.
+ *
+ * In the `transformWithStateHelper` method, when `initialState` is not provided, we cannot use
+ * `agnosticEncoderFor[S]` for the initial state encoder because it would incorrectly resolve to one of
+ * the other encoders. Instead, we use `EmptyInitialStateStruct` as a sentinel type to create a proper encoder
+ * that represents the absence of initial state data.
+ */
+case class EmptyInitialStateStruct()
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/SparkSession.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/SparkSession.scala
index 739b0318759e5..646db83981fe2 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/SparkSession.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/SparkSession.scala
@@ -40,7 +40,7 @@ import org.apache.spark.api.java.JavaRDD
import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.ExecutePlanResponse
import org.apache.spark.connect.proto.ExecutePlanResponse.ObservedMetrics
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CONFIG, PATH}
import org.apache.spark.rdd.RDD
import org.apache.spark.sql
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/StreamingQueryListenerBus.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/StreamingQueryListenerBus.scala
index 30cdf2b5cadb4..52b0ea24e9e33 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/StreamingQueryListenerBus.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/StreamingQueryListenerBus.scala
@@ -22,7 +22,7 @@ import java.util.concurrent.CopyOnWriteArrayList
import scala.jdk.CollectionConverters._
import org.apache.spark.connect.proto.{Command, ExecutePlanResponse, Plan, StreamingQueryEventType}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.connect.client.CloseableIterator
import org.apache.spark.sql.streaming.StreamingQueryListener
import org.apache.spark.sql.streaming.StreamingQueryListener.{Event, QueryIdleEvent, QueryProgressEvent, QueryStartedEvent, QueryTerminatedEvent}
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/ArtifactManager.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/ArtifactManager.scala
index e9411dc3db61b..213cd1d2e8673 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/ArtifactManager.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/ArtifactManager.scala
@@ -33,7 +33,6 @@ import com.google.protobuf.ByteString
import io.grpc.StatusRuntimeException
import io.grpc.stub.StreamObserver
import org.apache.commons.codec.digest.DigestUtils.sha256Hex
-import org.apache.commons.lang3.StringUtils
import org.apache.spark.SparkException
import org.apache.spark.connect.proto
@@ -41,7 +40,7 @@ import org.apache.spark.connect.proto.AddArtifactsResponse
import org.apache.spark.connect.proto.AddArtifactsResponse.ArtifactSummary
import org.apache.spark.sql.Artifact
import org.apache.spark.sql.Artifact.{newCacheArtifact, newIvyArtifacts}
-import org.apache.spark.util.{SparkFileUtils, SparkThreadUtils}
+import org.apache.spark.util.{SparkFileUtils, SparkStringUtils, SparkThreadUtils}
/**
* The Artifact Manager is responsible for handling and transferring artifacts from the local
@@ -173,7 +172,8 @@ class ArtifactManager(
.addAllNames(Arrays.asList(artifactName))
.build()
val response = bstub.artifactStatus(request)
- if (StringUtils.isNotEmpty(response.getSessionId) && response.getSessionId != sessionId) {
+ if (SparkStringUtils.isNotEmpty(response.getSessionId) &&
+ response.getSessionId != sessionId) {
// In older versions of the Spark cluster, the session ID is not set in the response.
// Ignore this check to keep compatibility.
throw new IllegalStateException(
@@ -248,7 +248,7 @@ class ArtifactManager(
val responseHandler = new StreamObserver[proto.AddArtifactsResponse] {
private val summaries = mutable.Buffer.empty[ArtifactSummary]
override def onNext(v: AddArtifactsResponse): Unit = {
- if (StringUtils.isNotEmpty(v.getSessionId) && v.getSessionId != sessionId) {
+ if (SparkStringUtils.isNotEmpty(v.getSessionId) && v.getSessionId != sessionId) {
// In older versions of the Spark cluster, the session ID is not set in the response.
// Ignore this check to keep compatibility.
throw new IllegalStateException(s"Session ID mismatch: $sessionId != ${v.getSessionId}")
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/GrpcRetryHandler.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/GrpcRetryHandler.scala
index 7e0a356b9e493..3f4558ee97dad 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/GrpcRetryHandler.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/GrpcRetryHandler.scala
@@ -23,7 +23,6 @@ import io.grpc.stub.StreamObserver
import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{ERROR, NUM_RETRY, POLICY, RETRY_WAIT_TIME}
-import org.apache.spark.internal.MDC
private[sql] class GrpcRetryHandler(
private val policies: Seq[RetryPolicy],
@@ -194,15 +193,17 @@ private[sql] object GrpcRetryHandler extends Logging {
return
}
- for (policy <- policies if policy.canRetry(lastException)) {
- val time = policy.nextAttempt()
-
+ // Find the first policy that can retry this error and use it to compute the wait time.
+ val matchedPolicyOpt = policies.find(_.canRetry(lastException))
+ if (matchedPolicyOpt.isDefined) {
+ val matchedPolicy = matchedPolicyOpt.get
+ val time = matchedPolicy.nextAttempt(lastException)
if (time.isDefined) {
logWarning(
log"Non-Fatal error during RPC execution: ${MDC(ERROR, lastException)}, " +
log"retrying (wait=${MDC(RETRY_WAIT_TIME, time.get.toMillis)} ms, " +
log"currentRetryNum=${MDC(NUM_RETRY, currentRetryNum)}, " +
- log"policy=${MDC(POLICY, policy.getName)}).")
+ log"policy=${MDC(POLICY, matchedPolicy.getName)}).")
sleep(time.get.toMillis)
return
}
@@ -212,9 +213,8 @@ private[sql] object GrpcRetryHandler extends Logging {
log"Non-Fatal error during RPC execution: ${MDC(ERROR, lastException)}, " +
log"exceeded retries (currentRetryNum=${MDC(NUM_RETRY, currentRetryNum)})")
- val error = new RetriesExceeded()
- exceptionList.foreach(error.addSuppressed)
- throw error
+ logWarning(log"[RETRIES_EXCEEDED] The maximum number of retries has been exceeded.")
+ throw lastException
}
def retry(): T = {
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetryPolicy.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetryPolicy.scala
index 8c8472d780dbc..5b5c4b517923e 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetryPolicy.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/RetryPolicy.scala
@@ -18,9 +18,14 @@
package org.apache.spark.sql.connect.client
import scala.concurrent.duration.{Duration, FiniteDuration}
+import scala.jdk.CollectionConverters._
import scala.util.Random
+import com.google.rpc.RetryInfo
import io.grpc.{Status, StatusRuntimeException}
+import io.grpc.protobuf.StatusProto
+
+import org.apache.spark.internal.Logging
/**
* [[RetryPolicy]] configure the retry mechanism in [[GrpcRetryHandler]]
@@ -33,8 +38,27 @@ import io.grpc.{Status, StatusRuntimeException}
* Maximal value of the exponential backoff (ms).
* @param backoffMultiplier
* Multiplicative base of the exponential backoff.
+ * @param jitter
+ * Sample a random value uniformly from the range [0, jitter] and add it to the backoff.
+ * @param minJitterThreshold
+ * Minimal value of the backoff to add random jitter.
* @param canRetry
* Function that determines whether a retry is to be performed in the event of an error.
+ * @param name
+ * Name of the policy.
+ * @param recognizeServerRetryDelay
+ * Per the gRPC standard, the server can send error messages that contain a `RetryInfo` message with
+ * a `retry_delay` field indicating that the client should wait for at least `retry_delay` amount
+ * of time before retrying again, see:
+ * https://github.com/googleapis/googleapis/blob/master/google/rpc/error_details.proto#L91
+ *
+ * If this flag is set to true, RetryPolicy will use the `RetryInfo.retry_delay` field in the backoff
+ * computation. The server's `retry_delay` can override the client's `maxBackoff`.
+ *
+ * This flag does not change which errors are retried, only how the backoff is computed.
+ * `DefaultPolicy` additionally has a rule for retrying any error that contains `RetryInfo`.
+ * @param maxServerRetryDelay
+ * Limit for the server-provided `retry_delay`.
*/
case class RetryPolicy(
maxRetries: Option[Int] = None,
@@ -44,14 +68,16 @@ case class RetryPolicy(
jitter: FiniteDuration = FiniteDuration(0, "s"),
minJitterThreshold: FiniteDuration = FiniteDuration(0, "s"),
canRetry: Throwable => Boolean,
- name: String) {
+ name: String,
+ recognizeServerRetryDelay: Boolean = false,
+ maxServerRetryDelay: Option[FiniteDuration] = None) {
def getName: String = name
def toState: RetryPolicy.RetryPolicyState = new RetryPolicy.RetryPolicyState(this)
}
-object RetryPolicy {
+object RetryPolicy extends Logging {
def defaultPolicy(): RetryPolicy = RetryPolicy(
name = "DefaultPolicy",
// Please synchronize changes here with Python side:
@@ -65,7 +91,9 @@ object RetryPolicy {
backoffMultiplier = 4.0,
jitter = FiniteDuration(500, "ms"),
minJitterThreshold = FiniteDuration(2, "s"),
- canRetry = defaultPolicyRetryException)
+ canRetry = defaultPolicyRetryException,
+ recognizeServerRetryDelay = true,
+ maxServerRetryDelay = Some(FiniteDuration(10, "min")))
// list of policies to be used by this client
def defaultPolicies(): Seq[RetryPolicy] = List(defaultPolicy())
@@ -77,7 +105,7 @@ object RetryPolicy {
private var nextWait: Duration = policy.initialBackoff
// return waiting time until next attempt, or None if has exceeded max retries
- def nextAttempt(): Option[Duration] = {
+ def nextAttempt(e: Throwable): Option[Duration] = {
if (policy.maxRetries.isDefined && numberAttempts >= policy.maxRetries.get) {
return None
}
@@ -90,6 +118,14 @@ object RetryPolicy {
nextWait = nextWait min policy.maxBackoff.get
}
+ if (policy.recognizeServerRetryDelay) {
+ extractRetryDelay(e).foreach { retryDelay =>
+ logDebug(s"The server has sent a retry delay of $retryDelay ms.")
+ val retryDelayLimited = retryDelay min policy.maxServerRetryDelay.getOrElse(retryDelay)
+ currentWait = currentWait max retryDelayLimited
+ }
+ }
+
if (currentWait >= policy.minJitterThreshold) {
currentWait += Random.nextDouble() * policy.jitter
}
@@ -127,8 +163,33 @@ object RetryPolicy {
if (statusCode == Status.Code.UNAVAILABLE) {
return true
}
+
+ // All error messages containing `RetryInfo` should be retried.
+ if (extractRetryInfo(e).isDefined) {
+ return true
+ }
+
false
case _ => false
}
}
+
+ private def extractRetryInfo(e: Throwable): Option[RetryInfo] = {
+ e match {
+ case e: StatusRuntimeException =>
+ Option(StatusProto.fromThrowable(e))
+ .flatMap(status =>
+ status.getDetailsList.asScala
+ .find(_.is(classOf[RetryInfo]))
+ .map(_.unpack(classOf[RetryInfo])))
+ case _ => None
+ }
+ }
+
+ private def extractRetryDelay(e: Throwable): Option[FiniteDuration] = {
+ extractRetryInfo(e)
+ .flatMap(retryInfo => Option(retryInfo.getRetryDelay))
+ .map(retryDelay =>
+ FiniteDuration(retryDelay.getSeconds, "s") + FiniteDuration(retryDelay.getNanos, "ns"))
+ }
}
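Aside (not part of the patch): a minimal sketch of the error shape this policy reacts to, built with standard gRPC/protobuf APIs; it approximates what the suite's createTestExceptionWithDetails helper is assumed to produce.

import com.google.protobuf.{Any => ProtoAny, Duration => ProtoDuration}
import com.google.rpc.{RetryInfo, Status => RpcStatus}
import io.grpc.{Status, StatusRuntimeException}
import io.grpc.protobuf.StatusProto

// Sketch only: an UNAVAILABLE error whose details carry RetryInfo.retry_delay.
def unavailableWithRetryDelay(seconds: Long): StatusRuntimeException = {
  val retryInfo = RetryInfo
    .newBuilder()
    .setRetryDelay(ProtoDuration.newBuilder().setSeconds(seconds))
    .build()
  val rpcStatus = RpcStatus
    .newBuilder()
    .setCode(Status.Code.UNAVAILABLE.value())
    .setMessage("try again later")
    .addDetails(ProtoAny.pack(retryInfo))
    .build()
  StatusProto.toStatusRuntimeException(rpcStatus)
}

With recognizeServerRetryDelay enabled, DefaultPolicy waits at least the extracted retry_delay (capped by maxServerRetryDelay) before the next attempt, instead of relying only on its exponential backoff.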
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/SparkConnectClient.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/SparkConnectClient.scala
index e844237a3bb44..48f01a8042a64 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/SparkConnectClient.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/SparkConnectClient.scala
@@ -33,6 +33,7 @@ import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.UserContext
import org.apache.spark.sql.connect.common.ProtoUtils
import org.apache.spark.sql.connect.common.config.ConnectCommon
+import org.apache.spark.util.SparkSystemUtils
/**
* Conceptually the remote spark session that communicates with the server.
@@ -707,12 +708,11 @@ object SparkConnectClient {
*/
private def genUserAgent(value: String): String = {
val scalaVersion = Properties.versionNumberString
- val jvmVersion = System.getProperty("java.version").split("_")(0)
+ val jvmVersion = SparkSystemUtils.javaVersion.split("_")(0)
val osName = {
- val os = System.getProperty("os.name").toLowerCase(Locale.ROOT)
- if (os.contains("mac")) "darwin"
- else if (os.contains("linux")) "linux"
- else if (os.contains("win")) "windows"
+ if (SparkSystemUtils.isMac) "darwin"
+ else if (SparkSystemUtils.isLinux) "linux"
+ else if (SparkSystemUtils.isWindows) "windows"
else "unknown"
}
List(
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowDeserializer.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowDeserializer.scala
index ceeece073da65..7597a0ceeb8cd 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowDeserializer.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowDeserializer.scala
@@ -200,6 +200,10 @@ object ArrowDeserializers {
new LeafFieldDeserializer[LocalDateTime](encoder, v, timeZoneId) {
override def value(i: Int): LocalDateTime = reader.getLocalDateTime(i)
}
+ case (LocalTimeEncoder, v: FieldVector) =>
+ new LeafFieldDeserializer[LocalTime](encoder, v, timeZoneId) {
+ override def value(i: Int): LocalTime = reader.getLocalTime(i)
+ }
case (OptionEncoder(value), v) =>
val deserializer = deserializerFor(value, v, timeZoneId)
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowSerializer.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowSerializer.scala
index d79fb25ec1a0b..4acb11f014d19 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowSerializer.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowSerializer.scala
@@ -20,7 +20,7 @@ import java.io.{ByteArrayOutputStream, OutputStream}
import java.lang.invoke.{MethodHandles, MethodType}
import java.math.{BigDecimal => JBigDecimal, BigInteger => JBigInteger}
import java.nio.channels.Channels
-import java.time.{Duration, Instant, LocalDate, LocalDateTime, Period}
+import java.time.{Duration, Instant, LocalDate, LocalDateTime, LocalTime, Period}
import java.util.{Map => JMap, Objects}
import scala.jdk.CollectionConverters._
@@ -392,6 +392,11 @@ object ArrowSerializer {
override def set(index: Int, value: LocalDateTime): Unit =
vector.setSafe(index, SparkDateTimeUtils.localDateTimeToMicros(value))
}
+ case (LocalTimeEncoder, v: TimeNanoVector) =>
+ new FieldSerializer[LocalTime, TimeNanoVector](v) {
+ override def set(index: Int, value: LocalTime): Unit =
+ vector.setSafe(index, SparkDateTimeUtils.localTimeToNanos(value))
+ }
case (OptionEncoder(value), v) =>
new Serializer {
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowVectorReader.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowVectorReader.scala
index 3dbfce18e7b48..ea57e0e1c77fa 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowVectorReader.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/client/arrow/ArrowVectorReader.scala
@@ -18,17 +18,18 @@ package org.apache.spark.sql.connect.client.arrow
import java.math.{BigDecimal => JBigDecimal}
import java.sql.{Date, Timestamp}
-import java.time.{Duration, Instant, LocalDate, LocalDateTime, Period, ZoneOffset}
+import java.time.{Duration, Instant, LocalDate, LocalDateTime, LocalTime, Period, ZoneOffset}
import org.apache.arrow.vector._
import org.apache.arrow.vector.util.Text
-import org.apache.spark.sql.catalyst.util.{DateFormatter, SparkIntervalUtils, SparkStringUtils, TimestampFormatter}
+import org.apache.spark.sql.catalyst.util.{DateFormatter, SparkIntervalUtils, TimeFormatter, TimestampFormatter}
import org.apache.spark.sql.catalyst.util.DateTimeConstants.MICROS_PER_SECOND
import org.apache.spark.sql.catalyst.util.IntervalStringStyles.ANSI_STYLE
import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils._
import org.apache.spark.sql.types.{DataType, DayTimeIntervalType, Decimal, UpCastRule, YearMonthIntervalType}
import org.apache.spark.sql.util.ArrowUtils
+import org.apache.spark.util.SparkStringUtils
/**
* Base class for reading leaf values from an arrow vector. This reader has read methods for all
@@ -59,6 +60,7 @@ private[arrow] abstract class ArrowVectorReader {
def getInstant(i: Int): java.time.Instant = unsupported()
def getLocalDate(i: Int): java.time.LocalDate = unsupported()
def getLocalDateTime(i: Int): java.time.LocalDateTime = unsupported()
+ def getLocalTime(i: Int): java.time.LocalTime = unsupported()
private def unsupported(): Nothing = throw new UnsupportedOperationException()
}
@@ -90,6 +92,7 @@ object ArrowVectorReader {
case v: DateDayVector => new DateDayVectorReader(v, timeZoneId)
case v: TimeStampMicroTZVector => new TimeStampMicroTZVectorReader(v)
case v: TimeStampMicroVector => new TimeStampMicroVectorReader(v, timeZoneId)
+ case v: TimeNanoVector => new TimeVectorReader(v)
case _: NullVector => NullVectorReader
case _ => throw new RuntimeException("Unsupported Vector Type: " + vector.getClass)
}
@@ -275,3 +278,11 @@ private[arrow] class TimeStampMicroVectorReader(v: TimeStampMicroVector, timeZon
override def getLocalDateTime(i: Int): LocalDateTime = microsToLocalDateTime(utcMicros(i))
override def getString(i: Int): String = formatter.format(utcMicros(i))
}
+
+private[arrow] class TimeVectorReader(v: TimeNanoVector)
+ extends TypedArrowVectorReader[TimeNanoVector](v) {
+ private lazy val formatter = TimeFormatter.getFractionFormatter()
+ private def nanos(i: Int): Long = vector.get(i)
+ override def getLocalTime(i: Int): LocalTime = nanosToLocalTime(nanos(i))
+ override def getString(i: Int): String = formatter.format(nanos(i))
+}
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/columnNodeSupport.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/columnNodeSupport.scala
index 1e798387726bb..cbbec0599b77b 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/columnNodeSupport.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/columnNodeSupport.scala
@@ -29,7 +29,7 @@ import org.apache.spark.sql.catalyst.encoders.RowEncoder
import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin}
import org.apache.spark.sql.connect.ConnectConversions._
import org.apache.spark.sql.connect.common.DataTypeProtoConverter
-import org.apache.spark.sql.connect.common.LiteralValueProtoConverter.toLiteralProtoBuilder
+import org.apache.spark.sql.connect.common.LiteralValueProtoConverter.{toLiteralProtoBuilderWithOptions, ToLiteralProtoOptions}
import org.apache.spark.sql.expressions.{Aggregator, UserDefinedAggregateFunction, UserDefinedAggregator, UserDefinedFunction}
import org.apache.spark.sql.internal.{Alias, CaseWhenOtherwise, Cast, ColumnNode, ColumnNodeLike, InvokeInlineUserDefinedFunction, LambdaFunction, LazyExpression, Literal, SortOrder, SqlExpression, SubqueryExpression, SubqueryType, UnresolvedAttribute, UnresolvedExtractValue, UnresolvedFunction, UnresolvedNamedLambdaVariable, UnresolvedRegex, UnresolvedStar, UpdateFields, Window, WindowFrame}
@@ -65,11 +65,12 @@ object ColumnNodeToProtoConverter extends (ColumnNode => proto.Expression) {
val builder = proto.Expression.newBuilder()
val n = additionalTransformation.map(_(node)).getOrElse(node)
n match {
- case Literal(value, None, _) =>
- builder.setLiteral(toLiteralProtoBuilder(value))
-
- case Literal(value, Some(dataType), _) =>
- builder.setLiteral(toLiteralProtoBuilder(value, dataType))
+ case Literal(value, dataTypeOpt, _) =>
+ builder.setLiteral(
+ toLiteralProtoBuilderWithOptions(
+ value,
+ dataTypeOpt,
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = false)))
case u @ UnresolvedAttribute(unparsedIdentifier, planId, isMetadataColumn, _) =>
val escapedName = u.sql
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/DataTypeProtoConverter.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/DataTypeProtoConverter.scala
index 8c83ad3d1f550..4ff555c5645bd 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/DataTypeProtoConverter.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/DataTypeProtoConverter.scala
@@ -53,6 +53,12 @@ object DataTypeProtoConverter {
case proto.DataType.KindCase.DATE => DateType
case proto.DataType.KindCase.TIMESTAMP => TimestampType
case proto.DataType.KindCase.TIMESTAMP_NTZ => TimestampNTZType
+ case proto.DataType.KindCase.TIME =>
+ if (t.getTime.hasPrecision) {
+ TimeType(t.getTime.getPrecision)
+ } else {
+ TimeType()
+ }
case proto.DataType.KindCase.CALENDAR_INTERVAL => CalendarIntervalType
case proto.DataType.KindCase.YEAR_MONTH_INTERVAL =>
@@ -204,6 +210,12 @@ object DataTypeProtoConverter {
case TimestampNTZType => ProtoDataTypes.TimestampNTZType
+ case TimeType(precision) =>
+ proto.DataType
+ .newBuilder()
+ .setTime(proto.DataType.Time.newBuilder().setPrecision(precision).build())
+ .build()
+
case CalendarIntervalType => ProtoDataTypes.CalendarIntervalType
case YearMonthIntervalType(startField, endField) =>
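Aside (not part of the patch): a small round-trip sketch for the new TIME mapping; treating toConnectProtoType as the public entry point used above is an assumption.

import org.apache.spark.sql.connect.common.DataTypeProtoConverter.toConnectProtoType
import org.apache.spark.sql.types.TimeType

// TimeType carries its precision into proto.DataType.Time; the reverse mapping above
// falls back to TimeType() when the optional precision field is absent.
val timeProto = toConnectProtoType(TimeType(6))
assert(timeProto.getTime.hasPrecision && timeProto.getTime.getPrecision == 6)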
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/LiteralValueProtoConverter.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/LiteralValueProtoConverter.scala
index 1f3496fa89847..870a452e85ecd 100644
--- a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/LiteralValueProtoConverter.scala
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/LiteralValueProtoConverter.scala
@@ -23,7 +23,6 @@ import java.sql.{Date, Timestamp}
import java.time._
import scala.collection.{immutable, mutable}
-import scala.jdk.CollectionConverters._
import scala.reflect.ClassTag
import scala.reflect.runtime.universe.TypeTag
import scala.util.Try
@@ -40,14 +39,10 @@ import org.apache.spark.util.SparkClassUtils
object LiteralValueProtoConverter {
- /**
- * Transforms literal value to the `proto.Expression.Literal.Builder`.
- *
- * @return
- * proto.Expression.Literal.Builder
- */
@scala.annotation.tailrec
- def toLiteralProtoBuilder(literal: Any): proto.Expression.Literal.Builder = {
+ private def toLiteralProtoBuilderInternal(
+ literal: Any,
+ options: ToLiteralProtoOptions): proto.Expression.Literal.Builder = {
val builder = proto.Expression.Literal.newBuilder()
def decimalBuilder(precision: Int, scale: Int, value: String) = {
@@ -63,8 +58,17 @@ object LiteralValueProtoConverter {
def arrayBuilder(array: Array[_]) = {
val ab = builder.getArrayBuilder
- .setElementType(toConnectProtoType(toDataType(array.getClass.getComponentType)))
- array.foreach(x => ab.addElements(toLiteralProto(x)))
+ if (options.useDeprecatedDataTypeFields) {
+ ab.setElementType(toConnectProtoType(toDataType(array.getClass.getComponentType)))
+ } else {
+ ab.setDataType(
+ proto.DataType.Array
+ .newBuilder()
+ .setElementType(toConnectProtoType(toDataType(array.getClass.getComponentType)))
+ .setContainsNull(true)
+ .build())
+ }
+ array.foreach(x => ab.addElements(toLiteralProtoWithOptions(x, None, options)))
ab
}
@@ -84,8 +88,8 @@ object LiteralValueProtoConverter {
case v: Char => builder.setString(v.toString)
case v: Array[Char] => builder.setString(String.valueOf(v))
case v: Array[Byte] => builder.setBinary(ByteString.copyFrom(v))
- case v: mutable.ArraySeq[_] => toLiteralProtoBuilder(v.array)
- case v: immutable.ArraySeq[_] => toLiteralProtoBuilder(v.unsafeArray)
+ case v: mutable.ArraySeq[_] => toLiteralProtoBuilderInternal(v.array, options)
+ case v: immutable.ArraySeq[_] => toLiteralProtoBuilderInternal(v.unsafeArray, options)
case v: LocalDate => builder.setDate(v.toEpochDay.toInt)
case v: Decimal =>
builder.setDecimal(decimalBuilder(Math.max(v.precision, v.scale), v.scale, v.toString))
@@ -96,6 +100,11 @@ object LiteralValueProtoConverter {
case v: Date => builder.setDate(SparkDateTimeUtils.fromJavaDate(v))
case v: Duration => builder.setDayTimeInterval(SparkIntervalUtils.durationToMicros(v))
case v: Period => builder.setYearMonthInterval(SparkIntervalUtils.periodToMonths(v))
+ case v: LocalTime =>
+ builder.setTime(
+ builder.getTimeBuilder
+ .setNano(SparkDateTimeUtils.localTimeToNanos(v))
+ .setPrecision(TimeType.DEFAULT_PRECISION))
case v: Array[_] => builder.setArray(arrayBuilder(v))
case v: CalendarInterval =>
builder.setCalendarInterval(calendarIntervalBuilder(v.months, v.days, v.microseconds))
@@ -105,19 +114,31 @@ object LiteralValueProtoConverter {
}
@scala.annotation.tailrec
- def toLiteralProtoBuilder(
+ private def toLiteralProtoBuilderInternal(
literal: Any,
- dataType: DataType): proto.Expression.Literal.Builder = {
+ dataType: DataType,
+ options: ToLiteralProtoOptions): proto.Expression.Literal.Builder = {
val builder = proto.Expression.Literal.newBuilder()
- def arrayBuilder(scalaValue: Any, elementType: DataType) = {
- val ab = builder.getArrayBuilder.setElementType(toConnectProtoType(elementType))
-
+ def arrayBuilder(scalaValue: Any, elementType: DataType, containsNull: Boolean) = {
+ val ab = builder.getArrayBuilder
+ if (options.useDeprecatedDataTypeFields) {
+ ab.setElementType(toConnectProtoType(elementType))
+ } else {
+ ab.setDataType(
+ proto.DataType.Array
+ .newBuilder()
+ .setElementType(toConnectProtoType(elementType))
+ .setContainsNull(containsNull)
+ .build())
+ }
scalaValue match {
case a: Array[_] =>
- a.foreach(item => ab.addElements(toLiteralProto(item, elementType)))
+ a.foreach(item =>
+ ab.addElements(toLiteralProtoWithOptions(item, Some(elementType), options)))
case s: scala.collection.Seq[_] =>
- s.foreach(item => ab.addElements(toLiteralProto(item, elementType)))
+ s.foreach(item =>
+ ab.addElements(toLiteralProtoWithOptions(item, Some(elementType), options)))
case other =>
throw new IllegalArgumentException(s"literal $other not supported (yet).")
}
@@ -125,16 +146,30 @@ object LiteralValueProtoConverter {
ab
}
- def mapBuilder(scalaValue: Any, keyType: DataType, valueType: DataType) = {
+ def mapBuilder(
+ scalaValue: Any,
+ keyType: DataType,
+ valueType: DataType,
+ valueContainsNull: Boolean) = {
val mb = builder.getMapBuilder
- .setKeyType(toConnectProtoType(keyType))
- .setValueType(toConnectProtoType(valueType))
+ if (options.useDeprecatedDataTypeFields) {
+ mb.setKeyType(toConnectProtoType(keyType))
+ mb.setValueType(toConnectProtoType(valueType))
+ } else {
+ mb.setDataType(
+ proto.DataType.Map
+ .newBuilder()
+ .setKeyType(toConnectProtoType(keyType))
+ .setValueType(toConnectProtoType(valueType))
+ .setValueContainsNull(valueContainsNull)
+ .build())
+ }
scalaValue match {
case map: scala.collection.Map[_, _] =>
map.foreach { case (k, v) =>
- mb.addKeys(toLiteralProto(k, keyType))
- mb.addValues(toLiteralProto(v, valueType))
+ mb.addKeys(toLiteralProtoWithOptions(k, Some(keyType), options))
+ mb.addValues(toLiteralProtoWithOptions(v, Some(valueType), options))
}
case other =>
throw new IllegalArgumentException(s"literal $other not supported (yet).")
@@ -144,16 +179,47 @@ object LiteralValueProtoConverter {
}
def structBuilder(scalaValue: Any, structType: StructType) = {
- val sb = builder.getStructBuilder.setStructType(toConnectProtoType(structType))
- val dataTypes = structType.fields.map(_.dataType)
+ val sb = builder.getStructBuilder
+ val fields = structType.fields
scalaValue match {
case p: Product =>
val iter = p.productIterator
var idx = 0
- while (idx < structType.size) {
- sb.addElements(toLiteralProto(iter.next(), dataTypes(idx)))
- idx += 1
+ if (options.useDeprecatedDataTypeFields) {
+ while (idx < structType.size) {
+ val field = fields(idx)
+ val literalProto =
+ toLiteralProtoWithOptions(iter.next(), Some(field.dataType), options)
+ sb.addElements(literalProto)
+ idx += 1
+ }
+ sb.setStructType(toConnectProtoType(structType))
+ } else {
+ val dataTypeStruct = proto.DataType.Struct.newBuilder()
+ while (idx < structType.size) {
+ val field = fields(idx)
+ val literalProto =
+ toLiteralProtoWithOptions(iter.next(), Some(field.dataType), options)
+ sb.addElements(literalProto)
+
+ val fieldBuilder = dataTypeStruct
+ .addFieldsBuilder()
+ .setName(field.name)
+ .setNullable(field.nullable)
+
+ if (LiteralValueProtoConverter.getInferredDataType(literalProto).isEmpty) {
+ fieldBuilder.setDataType(toConnectProtoType(field.dataType))
+ }
+
+ // Set metadata if available
+ if (field.metadata != Metadata.empty) {
+ fieldBuilder.setMetadata(field.metadata.json)
+ }
+
+ idx += 1
+ }
+ sb.setDataTypeStruct(dataTypeStruct.build())
}
case other =>
throw new IllegalArgumentException(s"literal $other not supported (yet).")
@@ -164,24 +230,63 @@ object LiteralValueProtoConverter {
(literal, dataType) match {
case (v: mutable.ArraySeq[_], ArrayType(_, _)) =>
- toLiteralProtoBuilder(v.array, dataType)
+ toLiteralProtoBuilderInternal(v.array, dataType, options)
case (v: immutable.ArraySeq[_], ArrayType(_, _)) =>
- toLiteralProtoBuilder(v.unsafeArray, dataType)
+ toLiteralProtoBuilderInternal(v.unsafeArray, dataType, options)
case (v: Array[Byte], ArrayType(_, _)) =>
- toLiteralProtoBuilder(v)
- case (v, ArrayType(elementType, _)) =>
- builder.setArray(arrayBuilder(v, elementType))
- case (v, MapType(keyType, valueType, _)) =>
- builder.setMap(mapBuilder(v, keyType, valueType))
+ toLiteralProtoBuilderInternal(v, options)
+ case (v, ArrayType(elementType, containsNull)) =>
+ builder.setArray(arrayBuilder(v, elementType, containsNull))
+ case (v, MapType(keyType, valueType, valueContainsNull)) =>
+ builder.setMap(mapBuilder(v, keyType, valueType, valueContainsNull))
case (v, structType: StructType) =>
builder.setStruct(structBuilder(v, structType))
case (v: Option[_], _: DataType) =>
if (v.isDefined) {
- toLiteralProtoBuilder(v.get)
+ toLiteralProtoBuilderInternal(v.get, options)
} else {
builder.setNull(toConnectProtoType(dataType))
}
- case _ => toLiteralProtoBuilder(literal)
+ case (v: LocalTime, timeType: TimeType) =>
+ builder.setTime(
+ builder.getTimeBuilder
+ .setNano(SparkDateTimeUtils.localTimeToNanos(v))
+ .setPrecision(timeType.precision))
+ case _ => toLiteralProtoBuilderInternal(literal, options)
+ }
+
+ }
+
+ /**
+ * Transforms literal value to the `proto.Expression.Literal.Builder`.
+ *
+ * @return
+ * proto.Expression.Literal.Builder
+ */
+ def toLiteralProtoBuilder(literal: Any): proto.Expression.Literal.Builder = {
+ toLiteralProtoBuilderInternal(
+ literal,
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = true))
+ }
+
+ def toLiteralProtoBuilder(
+ literal: Any,
+ dataType: DataType): proto.Expression.Literal.Builder = {
+ toLiteralProtoBuilderInternal(
+ literal,
+ dataType,
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = true))
+ }
+
+ def toLiteralProtoBuilderWithOptions(
+ literal: Any,
+ dataTypeOpt: Option[DataType],
+ options: ToLiteralProtoOptions): proto.Expression.Literal.Builder = {
+ dataTypeOpt match {
+ case Some(dataType) =>
+ toLiteralProtoBuilderInternal(literal, dataType, options)
+ case None =>
+ toLiteralProtoBuilderInternal(literal, options)
}
}
@@ -192,6 +297,8 @@ object LiteralValueProtoConverter {
toLiteralProtoBuilder(v)
}
+ /**
+ * Options for converting literal values to proto. When `useDeprecatedDataTypeFields` is
+ * true, type information is written to the deprecated per-literal fields (`elementType`,
+ * `keyType`/`valueType`, `structType`); otherwise the new `DataType`-based fields
+ * (`dataType`, `dataTypeStruct`) are used.
+ */
+ case class ToLiteralProtoOptions(useDeprecatedDataTypeFields: Boolean)
+
/**
* Transforms literal value to the `proto.Expression.Literal`.
*
@@ -199,10 +306,27 @@ object LiteralValueProtoConverter {
* proto.Expression.Literal
*/
def toLiteralProto(literal: Any): proto.Expression.Literal =
- toLiteralProtoBuilder(literal).build()
+ toLiteralProtoBuilderInternal(
+ literal,
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = true)).build()
def toLiteralProto(literal: Any, dataType: DataType): proto.Expression.Literal =
- toLiteralProtoBuilder(literal, dataType).build()
+ toLiteralProtoBuilderInternal(
+ literal,
+ dataType,
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = true)).build()
+
+ def toLiteralProtoWithOptions(
+ literal: Any,
+ dataTypeOpt: Option[DataType],
+ options: ToLiteralProtoOptions): proto.Expression.Literal = {
+ dataTypeOpt match {
+ case Some(dataType) =>
+ toLiteralProtoBuilderInternal(literal, dataType, options).build()
+ case None =>
+ toLiteralProtoBuilderInternal(literal, options).build()
+ }
+ }
private[sql] def toDataType(clz: Class[_]): DataType = clz match {
// primitive types
@@ -290,6 +414,9 @@ object LiteralValueProtoConverter {
case proto.Expression.Literal.LiteralTypeCase.ARRAY =>
toCatalystArray(literal.getArray)
+ case proto.Expression.Literal.LiteralTypeCase.STRUCT =>
+ toCatalystStruct(literal.getStruct)
+
case other =>
throw new UnsupportedOperationException(
s"Unsupported Literal Type: ${other.getNumber} (${other.name})")
@@ -297,86 +424,250 @@ object LiteralValueProtoConverter {
}
private def getConverter(dataType: proto.DataType): proto.Expression.Literal => Any = {
- if (dataType.hasShort) { v =>
- v.getShort.toShort
- } else if (dataType.hasInteger) { v =>
- v.getInteger
- } else if (dataType.hasLong) { v =>
- v.getLong
- } else if (dataType.hasDouble) { v =>
- v.getDouble
- } else if (dataType.hasByte) { v =>
- v.getByte.toByte
- } else if (dataType.hasFloat) { v =>
- v.getFloat
- } else if (dataType.hasBoolean) { v =>
- v.getBoolean
- } else if (dataType.hasString) { v =>
- v.getString
- } else if (dataType.hasBinary) { v =>
- v.getBinary.toByteArray
- } else if (dataType.hasDate) { v =>
- v.getDate
- } else if (dataType.hasTimestamp) { v =>
- v.getTimestamp
- } else if (dataType.hasTimestampNtz) { v =>
- v.getTimestampNtz
- } else if (dataType.hasDayTimeInterval) { v =>
- v.getDayTimeInterval
- } else if (dataType.hasYearMonthInterval) { v =>
- v.getYearMonthInterval
- } else if (dataType.hasDecimal) { v =>
- Decimal(v.getDecimal.getValue)
- } else if (dataType.hasCalendarInterval) { v =>
- val interval = v.getCalendarInterval
- new CalendarInterval(interval.getMonths, interval.getDays, interval.getMicroseconds)
- } else if (dataType.hasArray) { v =>
- toCatalystArray(v.getArray)
- } else if (dataType.hasMap) { v =>
- toCatalystMap(v.getMap)
- } else if (dataType.hasStruct) { v =>
- toCatalystStruct(v.getStruct)
- } else {
- throw InvalidPlanInput(s"Unsupported Literal Type: $dataType)")
+ dataType.getKindCase match {
+ case proto.DataType.KindCase.SHORT => v => v.getShort.toShort
+ case proto.DataType.KindCase.INTEGER => v => v.getInteger
+ case proto.DataType.KindCase.LONG => v => v.getLong
+ case proto.DataType.KindCase.DOUBLE => v => v.getDouble
+ case proto.DataType.KindCase.BYTE => v => v.getByte.toByte
+ case proto.DataType.KindCase.FLOAT => v => v.getFloat
+ case proto.DataType.KindCase.BOOLEAN => v => v.getBoolean
+ case proto.DataType.KindCase.STRING => v => v.getString
+ case proto.DataType.KindCase.BINARY => v => v.getBinary.toByteArray
+ case proto.DataType.KindCase.DATE => v => v.getDate
+ case proto.DataType.KindCase.TIMESTAMP => v => v.getTimestamp
+ case proto.DataType.KindCase.TIMESTAMP_NTZ => v => v.getTimestampNtz
+ case proto.DataType.KindCase.DAY_TIME_INTERVAL => v => v.getDayTimeInterval
+ case proto.DataType.KindCase.YEAR_MONTH_INTERVAL => v => v.getYearMonthInterval
+ case proto.DataType.KindCase.DECIMAL => v => Decimal(v.getDecimal.getValue)
+ case proto.DataType.KindCase.CALENDAR_INTERVAL =>
+ v =>
+ val interval = v.getCalendarInterval
+ new CalendarInterval(interval.getMonths, interval.getDays, interval.getMicroseconds)
+ case proto.DataType.KindCase.ARRAY =>
+ v => toCatalystArrayInternal(v.getArray, dataType.getArray)
+ case proto.DataType.KindCase.MAP =>
+ v => toCatalystMapInternal(v.getMap, dataType.getMap)
+ case proto.DataType.KindCase.STRUCT =>
+ v => toCatalystStructInternal(v.getStruct, dataType.getStruct)
+ case _ =>
+ throw InvalidPlanInput(s"Unsupported Literal Type: ${dataType.getKindCase}")
}
}
- def toCatalystArray(array: proto.Expression.Literal.Array): Array[_] = {
+ private def getInferredDataType(
+ literal: proto.Expression.Literal,
+ recursive: Boolean = false): Option[proto.DataType] = {
+ if (literal.hasNull) {
+ return Some(literal.getNull)
+ }
+
+ val builder = proto.DataType.newBuilder()
+ literal.getLiteralTypeCase match {
+ case proto.Expression.Literal.LiteralTypeCase.BINARY =>
+ builder.setBinary(proto.DataType.Binary.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.BOOLEAN =>
+ builder.setBoolean(proto.DataType.Boolean.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.BYTE =>
+ builder.setByte(proto.DataType.Byte.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.SHORT =>
+ builder.setShort(proto.DataType.Short.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.INTEGER =>
+ builder.setInteger(proto.DataType.Integer.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.LONG =>
+ builder.setLong(proto.DataType.Long.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.FLOAT =>
+ builder.setFloat(proto.DataType.Float.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.DOUBLE =>
+ builder.setDouble(proto.DataType.Double.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.DATE =>
+ builder.setDate(proto.DataType.Date.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.TIMESTAMP =>
+ builder.setTimestamp(proto.DataType.Timestamp.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.TIMESTAMP_NTZ =>
+ builder.setTimestampNtz(proto.DataType.TimestampNTZ.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.CALENDAR_INTERVAL =>
+ builder.setCalendarInterval(proto.DataType.CalendarInterval.newBuilder.build())
+ case proto.Expression.Literal.LiteralTypeCase.STRUCT =>
+ if (recursive) {
+ val struct = literal.getStruct
+ val size = struct.getElementsCount
+ val structTypeBuilder = proto.DataType.Struct.newBuilder
+ var i = 0
+ while (i < size) {
+ val field = struct.getDataTypeStruct.getFields(i)
+ if (field.hasDataType) {
+ structTypeBuilder.addFields(field)
+ } else {
+ val element = struct.getElements(i)
+ getInferredDataType(element, recursive = true) match {
+ case Some(dataType) =>
+ val fieldBuilder = structTypeBuilder.addFieldsBuilder()
+ fieldBuilder.setName(field.getName)
+ fieldBuilder.setDataType(dataType)
+ fieldBuilder.setNullable(field.getNullable)
+ if (field.hasMetadata) {
+ fieldBuilder.setMetadata(field.getMetadata)
+ }
+ case None => return None
+ }
+ }
+ i += 1
+ }
+ builder.setStruct(structTypeBuilder.build())
+ } else {
+ builder.setStruct(proto.DataType.Struct.newBuilder.build())
+ }
+ case proto.Expression.Literal.LiteralTypeCase.ARRAY =>
+ if (recursive) {
+ val arrayType = literal.getArray.getDataType
+ val elementTypeOpt = if (arrayType.hasElementType) {
+ Some(arrayType.getElementType)
+ } else if (literal.getArray.getElementsCount > 0) {
+ getInferredDataType(literal.getArray.getElements(0), recursive = true)
+ } else {
+ None
+ }
+ if (elementTypeOpt.isDefined) {
+ builder.setArray(
+ proto.DataType.Array
+ .newBuilder()
+ .setElementType(elementTypeOpt.get)
+ .setContainsNull(arrayType.getContainsNull)
+ .build())
+ } else {
+ return None
+ }
+ } else {
+ builder.setArray(proto.DataType.Array.newBuilder.build())
+ }
+ case proto.Expression.Literal.LiteralTypeCase.MAP =>
+ if (recursive) {
+ val mapType = literal.getMap.getDataType
+ val keyTypeOpt = if (mapType.hasKeyType) {
+ Some(mapType.getKeyType)
+ } else if (literal.getMap.getKeysCount > 0) {
+ getInferredDataType(literal.getMap.getKeys(0), recursive = true)
+ } else {
+ None
+ }
+ val valueTypeOpt = if (mapType.hasValueType) {
+ Some(mapType.getValueType)
+ } else if (literal.getMap.getValuesCount > 0) {
+ getInferredDataType(literal.getMap.getValues(0), recursive = true)
+ } else {
+ None
+ }
+ if (keyTypeOpt.isDefined && valueTypeOpt.isDefined) {
+ builder.setMap(
+ proto.DataType.Map.newBuilder
+ .setKeyType(keyTypeOpt.get)
+ .setValueType(valueTypeOpt.get)
+ .setValueContainsNull(mapType.getValueContainsNull)
+ .build())
+ } else {
+ return None
+ }
+ } else {
+ builder.setMap(proto.DataType.Map.newBuilder.build())
+ }
+ case _ =>
+ // Not all data types support inferring the data type from the literal at the moment.
+ // For example, DayTimeInterval carries extra information (start_field and end_field)
+ // that cannot be inferred from the literal value alone.
+ return None
+ }
+ Some(builder.build())
+ }
+
+ private def toCatalystArrayInternal(
+ array: proto.Expression.Literal.Array,
+ arrayType: proto.DataType.Array): Array[_] = {
def makeArrayData[T](converter: proto.Expression.Literal => T)(implicit
tag: ClassTag[T]): Array[T] = {
- val builder = mutable.ArrayBuilder.make[T]
- val elementList = array.getElementsList
- builder.sizeHint(elementList.size())
- val iter = elementList.iterator()
- while (iter.hasNext) {
- builder += converter(iter.next())
+ val size = array.getElementsCount
+ if (size > 0) {
+ Array.tabulate(size)(i => converter(array.getElements(i)))
+ } else {
+ Array.empty[T]
}
- builder.result()
}
- makeArrayData(getConverter(array.getElementType))
+ makeArrayData(getConverter(arrayType.getElementType))
}
- def toCatalystMap(map: proto.Expression.Literal.Map): mutable.Map[_, _] = {
+ def getProtoArrayType(array: proto.Expression.Literal.Array): proto.DataType.Array = {
+ if (array.hasDataType) {
+ val literal = proto.Expression.Literal.newBuilder().setArray(array).build()
+ getInferredDataType(literal, recursive = true) match {
+ case Some(dataType) => dataType.getArray
+ case None => throw InvalidPlanInput("Cannot infer data type from this array literal.")
+ }
+ } else if (array.hasElementType) {
+ // For backward compatibility, we still support the old way to
+ // define the type of the array.
+ proto.DataType.Array.newBuilder
+ .setElementType(array.getElementType)
+ .setContainsNull(true)
+ .build()
+ } else {
+ throw InvalidPlanInput("Data type information is missing in the array literal.")
+ }
+ }
+
+ def toCatalystArray(array: proto.Expression.Literal.Array): Array[_] = {
+ toCatalystArrayInternal(array, getProtoArrayType(array))
+ }
+
+ private def toCatalystMapInternal(
+ map: proto.Expression.Literal.Map,
+ mapType: proto.DataType.Map): mutable.Map[_, _] = {
def makeMapData[K, V](
keyConverter: proto.Expression.Literal => K,
valueConverter: proto.Expression.Literal => V)(implicit
tagK: ClassTag[K],
tagV: ClassTag[V]): mutable.Map[K, V] = {
- val builder = mutable.HashMap.empty[K, V]
- val keys = map.getKeysList.asScala
- val values = map.getValuesList.asScala
- builder.sizeHint(keys.size)
- keys.zip(values).foreach { case (key, value) =>
- builder += ((keyConverter(key), valueConverter(value)))
+ val size = map.getKeysCount
+ if (size > 0) {
+ val m = mutable.LinkedHashMap.empty[K, V]
+ m.sizeHint(size)
+ m.addAll(Iterator.tabulate(size)(i =>
+ (keyConverter(map.getKeys(i)), valueConverter(map.getValues(i)))))
+ } else {
+ mutable.Map.empty[K, V]
}
- builder
}
- makeMapData(getConverter(map.getKeyType), getConverter(map.getValueType))
+ makeMapData(getConverter(mapType.getKeyType), getConverter(mapType.getValueType))
}
- def toCatalystStruct(struct: proto.Expression.Literal.Struct): Any = {
+ def getProtoMapType(map: proto.Expression.Literal.Map): proto.DataType.Map = {
+ if (map.hasDataType) {
+ val literal = proto.Expression.Literal.newBuilder().setMap(map).build()
+ getInferredDataType(literal, recursive = true) match {
+ case Some(dataType) => dataType.getMap
+ case None => throw InvalidPlanInput("Cannot infer data type from this map literal.")
+ }
+ } else if (map.hasKeyType && map.hasValueType) {
+ // For backward compatibility, we still support the old way to
+ // define the type of the map.
+ proto.DataType.Map.newBuilder
+ .setKeyType(map.getKeyType)
+ .setValueType(map.getValueType)
+ .setValueContainsNull(true)
+ .build()
+ } else {
+ throw InvalidPlanInput("Data type information is missing in the map literal.")
+ }
+ }
+
+ def toCatalystMap(map: proto.Expression.Literal.Map): mutable.Map[_, _] = {
+ toCatalystMapInternal(map, getProtoMapType(map))
+ }
+
+ private def toCatalystStructInternal(
+ struct: proto.Expression.Literal.Struct,
+ structType: proto.DataType.Struct): Any = {
def toTuple[A <: Object](data: Seq[A]): Product = {
try {
val tupleClass = SparkClassUtils.classForName(s"scala.Tuple${data.length}")
@@ -387,16 +678,32 @@ object LiteralValueProtoConverter {
}
}
- val elements = struct.getElementsList.asScala
- val dataTypes = struct.getStructType.getStruct.getFieldsList.asScala.map(_.getDataType)
- val structData = elements
- .zip(dataTypes)
- .map { case (element, dataType) =>
- getConverter(dataType)(element)
+ val size = struct.getElementsCount
+ val structData = Seq.tabulate(size) { i =>
+ val element = struct.getElements(i)
+ val dataType = structType.getFields(i).getDataType
+ getConverter(dataType)(element).asInstanceOf[Object]
+ }
+ toTuple(structData)
+ }
+
+ def getProtoStructType(struct: proto.Expression.Literal.Struct): proto.DataType.Struct = {
+ if (struct.hasDataTypeStruct) {
+ val literal = proto.Expression.Literal.newBuilder().setStruct(struct).build()
+ getInferredDataType(literal, recursive = true) match {
+ case Some(dataType) => dataType.getStruct
+ case None => throw InvalidPlanInput("Cannot infer data type from this struct literal.")
}
- .asInstanceOf[scala.collection.Seq[Object]]
- .toSeq
+ } else if (struct.hasStructType) {
+ // For backward compatibility, we still support the old way to
+ // define and convert struct types.
+ struct.getStructType.getStruct
+ } else {
+ throw InvalidPlanInput("Data type information is missing in the struct literal.")
+ }
+ }
- toTuple(structData)
+ def toCatalystStruct(struct: proto.Expression.Literal.Struct): Any = {
+ toCatalystStructInternal(struct, getProtoStructType(struct))
}
}
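Note: a minimal sketch of how the reworked converter API above could be exercised. `toLiteralProtoWithOptions`, `ToLiteralProtoOptions`, and `toCatalystArray` are defined in this patch; the imports, package paths, and sample values are assumptions of the sketch, not part of the change.

```scala
import org.apache.spark.sql.connect.common.LiteralValueProtoConverter
import org.apache.spark.sql.connect.common.LiteralValueProtoConverter.ToLiteralProtoOptions
import org.apache.spark.sql.types.{ArrayType, IntegerType}

// Old wire shape: the array literal carries the deprecated element_type field.
val legacy = LiteralValueProtoConverter.toLiteralProtoWithOptions(
  Seq(1, 2, 3),
  Some(ArrayType(IntegerType, containsNull = false)),
  ToLiteralProtoOptions(useDeprecatedDataTypeFields = true))

// New wire shape: the array literal carries a DataType.Array with contains_null.
val current = LiteralValueProtoConverter.toLiteralProtoWithOptions(
  Seq(1, 2, 3),
  Some(ArrayType(IntegerType, containsNull = false)),
  ToLiteralProtoOptions(useDeprecatedDataTypeFields = false))

// The reader accepts either shape and yields the same catalyst-side value.
val decoded = LiteralValueProtoConverter.toCatalystArray(current.getArray)
```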
diff --git a/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/ProtoSpecializedArray.scala b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/ProtoSpecializedArray.scala
new file mode 100644
index 0000000000000..eeccb1f77469c
--- /dev/null
+++ b/sql/connect/common/src/main/scala/org/apache/spark/sql/connect/common/ProtoSpecializedArray.scala
@@ -0,0 +1,172 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.spark.sql.connect.common
+
+import org.apache.spark.connect.proto
+
+/**
+ * Conversions between JVM arrays of primitives/Strings and the specialized repeated-value
+ * proto messages (Bools, Ints, Longs, Floats, Doubles, Strings). Empty arrays map to the
+ * default message instances and back.
+ */
+private[spark] object ProtoSpecializedArray {
+
+ def toArray(array: proto.Bools): Array[Boolean] = {
+ val size = array.getValuesCount
+ if (size > 0) {
+ val a = Array.ofDim[Boolean](size)
+ var i = 0
+ while (i < size) {
+ a(i) = array.getValues(i)
+ i += 1
+ }
+ a
+ } else {
+ Array.emptyBooleanArray
+ }
+ }
+
+ def toArray(array: proto.Ints): Array[Int] = {
+ val size = array.getValuesCount
+ if (size > 0) {
+ val a = Array.ofDim[Int](size)
+ var i = 0
+ while (i < size) {
+ a(i) = array.getValues(i)
+ i += 1
+ }
+ a
+ } else {
+ Array.emptyIntArray
+ }
+ }
+
+ def toArray(array: proto.Longs): Array[Long] = {
+ val size = array.getValuesCount
+ if (size > 0) {
+ val a = Array.ofDim[Long](size)
+ var i = 0
+ while (i < size) {
+ a(i) = array.getValues(i)
+ i += 1
+ }
+ a
+ } else {
+ Array.emptyLongArray
+ }
+ }
+
+ def toArray(array: proto.Floats): Array[Float] = {
+ val size = array.getValuesCount
+ if (size > 0) {
+ val a = Array.ofDim[Float](size)
+ var i = 0
+ while (i < size) {
+ a(i) = array.getValues(i)
+ i += 1
+ }
+ a
+ } else {
+ Array.emptyFloatArray
+ }
+ }
+
+ def toArray(array: proto.Doubles): Array[Double] = {
+ val size = array.getValuesCount
+ if (size > 0) {
+ val a = Array.ofDim[Double](size)
+ var i = 0
+ while (i < size) {
+ a(i) = array.getValues(i)
+ i += 1
+ }
+ a
+ } else {
+ Array.emptyDoubleArray
+ }
+ }
+
+ def toArray(array: proto.Strings): Array[String] = {
+ val size = array.getValuesCount
+ if (size > 0) {
+ val a = Array.ofDim[String](size)
+ var i = 0
+ while (i < size) {
+ a(i) = array.getValues(i)
+ i += 1
+ }
+ a
+ } else {
+ Array.empty[String]
+ }
+ }
+
+ def fromArray(array: Array[Boolean]): proto.Bools = {
+ if (array.nonEmpty) {
+ val builder = proto.Bools.newBuilder()
+ array.foreach(builder.addValues)
+ builder.build()
+ } else {
+ proto.Bools.getDefaultInstance
+ }
+ }
+
+ def fromArray(array: Array[Int]): proto.Ints = {
+ if (array.nonEmpty) {
+ val builder = proto.Ints.newBuilder()
+ array.foreach(builder.addValues)
+ builder.build()
+ } else {
+ proto.Ints.getDefaultInstance
+ }
+ }
+
+ def fromArray(array: Array[Long]): proto.Longs = {
+ if (array.nonEmpty) {
+ val builder = proto.Longs.newBuilder()
+ array.foreach(builder.addValues)
+ builder.build()
+ } else {
+ proto.Longs.getDefaultInstance
+ }
+ }
+
+ def fromArray(array: Array[Float]): proto.Floats = {
+ if (array.nonEmpty) {
+ val builder = proto.Floats.newBuilder()
+ array.foreach(builder.addValues)
+ builder.build()
+ } else {
+ proto.Floats.getDefaultInstance
+ }
+ }
+
+ def fromArray(array: Array[Double]): proto.Doubles = {
+ if (array.nonEmpty) {
+ val builder = proto.Doubles.newBuilder()
+ array.foreach(builder.addValues)
+ builder.build()
+ } else {
+ proto.Doubles.getDefaultInstance
+ }
+ }
+
+ def fromArray(array: Array[String]): proto.Strings = {
+ if (array.nonEmpty) {
+ val builder = proto.Strings.newBuilder()
+ array.foreach(builder.addValues)
+ builder.build()
+ } else {
+ proto.Strings.getDefaultInstance
+ }
+ }
+}
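Note: a small usage sketch for the helper above, assuming the package and proto message names used in this patch; the sample arrays are illustrative only.

```scala
import org.apache.spark.connect.proto
import org.apache.spark.sql.connect.common.ProtoSpecializedArray

// Round-trip a primitive array through the specialized proto message.
val longs: proto.Longs = ProtoSpecializedArray.fromArray(Array(1L, 2L, 3L))
val back: Array[Long] = ProtoSpecializedArray.toArray(longs)
assert(back.sameElements(Array(1L, 2L, 3L)))

// Empty arrays map to the default (empty) message instance and back.
assert(ProtoSpecializedArray.toArray(proto.Strings.getDefaultInstance).isEmpty)
```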
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/function_lit.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/function_lit.explain
index 4491b6166afae..888fdf71586fb 100644
--- a/sql/connect/common/src/test/resources/query-tests/explain-results/function_lit.explain
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/function_lit.explain
@@ -1,2 +1,2 @@
-Project [id#0L, id#0L, true AS true#0, 68 AS 68#0, 9872 AS 9872#0, -8726532 AS -8726532#0, 7834609328726532 AS 7834609328726532#0L, 2.718281828459045 AS 2.718281828459045#0, -0.8 AS -0.8#0, 89.97620 AS 89.97620#0, 89889.7667231 AS 89889.7667231#0, connect! AS connect!#0, T AS T#0, ABCDEFGHIJ AS ABCDEFGHIJ#0, 0x78797A7B7C7D7E7F808182838485868788898A8B8C8D8E AS X'78797A7B7C7D7E7F808182838485868788898A8B8C8D8E'#0, 0x0806 AS X'0806'#0, [8,6] AS ARRAY(8, 6)#0, null AS NULL#0, 2020-10-10 AS DATE '2020-10-10'#0, 8.997620 AS 8.997620#0, 2023-02-23 04:31:59.808 AS TIMESTAMP '2023-02-23 04:31:59.808'#0, 1969-12-31 16:00:12.345 AS TIMESTAMP '1969-12-31 16:00:12.345'#0, 2023-02-23 20:36:00 AS TIMESTAMP_NTZ '2023-02-23 20:36:00'#0, 2023-02-23 AS DATE '2023-02-23'#0, INTERVAL '0 00:03:20' DAY TO SECOND AS INTERVAL '0 00:03:20' DAY TO SECOND#0, ... 2 more fields]
+Project [id#0L, id#0L, true AS true#0, 68 AS 68#0, 9872 AS 9872#0, -8726532 AS -8726532#0, 7834609328726532 AS 7834609328726532#0L, 2.718281828459045 AS 2.718281828459045#0, -0.8 AS -0.8#0, 89.97620 AS 89.97620#0, 89889.7667231 AS 89889.7667231#0, connect! AS connect!#0, T AS T#0, ABCDEFGHIJ AS ABCDEFGHIJ#0, 0x78797A7B7C7D7E7F808182838485868788898A8B8C8D8E AS X'78797A7B7C7D7E7F808182838485868788898A8B8C8D8E'#0, 0x0806 AS X'0806'#0, [8,6] AS ARRAY(8, 6)#0, null AS NULL#0, 2020-10-10 AS DATE '2020-10-10'#0, 8.997620 AS 8.997620#0, 2023-02-23 04:31:59.808 AS TIMESTAMP '2023-02-23 04:31:59.808'#0, 1969-12-31 16:00:12.345 AS TIMESTAMP '1969-12-31 16:00:12.345'#0, 2023-02-23 20:36:00 AS TIMESTAMP_NTZ '2023-02-23 20:36:00'#0, 2023-02-23 AS DATE '2023-02-23'#0, INTERVAL '0 00:03:20' DAY TO SECOND AS INTERVAL '0 00:03:20' DAY TO SECOND#0, INTERVAL '0-0' YEAR TO MONTH AS INTERVAL '0-0' YEAR TO MONTH#0, 23:59:59.999999999 AS TIME '23:59:59.999999999'#0, 2 months 20 days 0.0001 seconds AS INTERVAL '2 months 20 days 0.0001 seconds'#0]
+- LocalRelation , [id#0L, a#0, b#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/function_try_to_date.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/function_try_to_date.explain
new file mode 100644
index 0000000000000..b154d54f57533
--- /dev/null
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/function_try_to_date.explain
@@ -0,0 +1,2 @@
+Project [cast(s#0 as date) AS try_to_date(s)#0]
++- LocalRelation , [d#0, t#0, s#0, x#0L, wt#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/function_try_to_date_with_format.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/function_try_to_date_with_format.explain
new file mode 100644
index 0000000000000..ab3e72abc21da
--- /dev/null
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/function_try_to_date_with_format.explain
@@ -0,0 +1,2 @@
+Project [cast(gettimestamp(s#0, yyyy-MM-dd, TimestampType, try_to_date, Some(America/Los_Angeles), false) as date) AS try_to_date(s, yyyy-MM-dd)#0]
++- LocalRelation , [d#0, t#0, s#0, x#0L, wt#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/function_typedLit.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/function_typedLit.explain
index 6d854da250fcc..943b353a14ccf 100644
--- a/sql/connect/common/src/test/resources/query-tests/explain-results/function_typedLit.explain
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/function_typedLit.explain
@@ -1,2 +1,2 @@
-Project [id#0L, id#0L, 1 AS 1#0, null AS NULL#0, true AS true#0, 68 AS 68#0, 9872 AS 9872#0, -8726532 AS -8726532#0, 7834609328726532 AS 7834609328726532#0L, 2.718281828459045 AS 2.718281828459045#0, -0.8 AS -0.8#0, 89.97620 AS 89.97620#0, 89889.7667231 AS 89889.7667231#0, connect! AS connect!#0, T AS T#0, ABCDEFGHIJ AS ABCDEFGHIJ#0, 0x78797A7B7C7D7E7F808182838485868788898A8B8C8D8E AS X'78797A7B7C7D7E7F808182838485868788898A8B8C8D8E'#0, 0x0806 AS X'0806'#0, [8,6] AS ARRAY(8, 6)#0, null AS NULL#0, 2020-10-10 AS DATE '2020-10-10'#0, 8.997620 AS 8.997620#0, 2023-02-23 04:31:59.808 AS TIMESTAMP '2023-02-23 04:31:59.808'#0, 1969-12-31 16:00:12.345 AS TIMESTAMP '1969-12-31 16:00:12.345'#0, 2023-02-23 20:36:00 AS TIMESTAMP_NTZ '2023-02-23 20:36:00'#0, ... 18 more fields]
+Project [id#0L, id#0L, 1 AS 1#0, null AS NULL#0, true AS true#0, 68 AS 68#0, 9872 AS 9872#0, -8726532 AS -8726532#0, 7834609328726532 AS 7834609328726532#0L, 2.718281828459045 AS 2.718281828459045#0, -0.8 AS -0.8#0, 89.97620 AS 89.97620#0, 89889.7667231 AS 89889.7667231#0, connect! AS connect!#0, T AS T#0, ABCDEFGHIJ AS ABCDEFGHIJ#0, 0x78797A7B7C7D7E7F808182838485868788898A8B8C8D8E AS X'78797A7B7C7D7E7F808182838485868788898A8B8C8D8E'#0, 0x0806 AS X'0806'#0, [8,6] AS ARRAY(8, 6)#0, null AS NULL#0, 2020-10-10 AS DATE '2020-10-10'#0, 8.997620 AS 8.997620#0, 2023-02-23 04:31:59.808 AS TIMESTAMP '2023-02-23 04:31:59.808'#0, 1969-12-31 16:00:12.345 AS TIMESTAMP '1969-12-31 16:00:12.345'#0, 2023-02-23 20:36:00 AS TIMESTAMP_NTZ '2023-02-23 20:36:00'#0, 2023-02-23 AS DATE '2023-02-23'#0, INTERVAL '0 00:03:20' DAY TO SECOND AS INTERVAL '0 00:03:20' DAY TO SECOND#0, INTERVAL '0-0' YEAR TO MONTH AS INTERVAL '0-0' YEAR TO MONTH#0, 23:59:59.999999999 AS TIME '23:59:59.999999999'#0, 2 months 20 days 0.0001 seconds AS INTERVAL '2 months 20 days 0.0001 seconds'#0, 1 AS 1#0, [1,2,3] AS ARRAY(1, 2, 3)#0, [1,2,3] AS ARRAY(1, 2, 3)#0, map(keys: [a,b], values: [1,2]) AS MAP('a', 1, 'b', 2)#0, [a,2,1.0] AS NAMED_STRUCT('_1', 'a', '_2', 2, '_3', 1.0D)#0, null AS NULL#0, [1] AS ARRAY(1)#0, map(keys: [1], values: [0]) AS MAP(1, 0)#0, map(keys: [1], values: [0]) AS MAP(1, 0)#0, map(keys: [1], values: [0]) AS MAP(1, 0)#0, [[1,2,3],[4,5,6],[7,8,9]] AS ARRAY(ARRAY(1, 2, 3), ARRAY(4, 5, 6), ARRAY(7, 8, 9))#0, [keys: [a,b], values: [1,2],keys: [a,b], values: [3,4],keys: [a,b], values: [5,6]] AS ARRAY(MAP('a', 1, 'b', 2), MAP('a', 3, 'b', 4), MAP('a', 5, 'b', 6))#0, map(keys: [1,2], values: [keys: [a,b], values: [1,2],keys: [a,b], values: [3,4]]) AS MAP(1, MAP('a', 1, 'b', 2), 2, MAP('a', 3, 'b', 4))#0, [[1,2,3],keys: [a,b], values: [1,2],[a,keys: [1,2], values: [a,b]]] AS NAMED_STRUCT('_1', ARRAY(1, 2, 3), '_2', MAP('a', 1, 'b', 2), '_3', NAMED_STRUCT('_1', 'a', '_2', MAP(1, 'a', 2, 'b')))#0]
+- LocalRelation , [id#0L, a#0, b#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/union.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/union.explain
index 4d5d1f53b8412..252774510896c 100644
--- a/sql/connect/common/src/test/resources/query-tests/explain-results/union.explain
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/union.explain
@@ -1,3 +1,3 @@
-Union false, false
+'Union false, false
:- LocalRelation , [id#0L, a#0, b#0]
+- LocalRelation , [id#0L, a#0, b#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/unionAll.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/unionAll.explain
index 4d5d1f53b8412..252774510896c 100644
--- a/sql/connect/common/src/test/resources/query-tests/explain-results/unionAll.explain
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/unionAll.explain
@@ -1,3 +1,3 @@
-Union false, false
+'Union false, false
:- LocalRelation , [id#0L, a#0, b#0]
+- LocalRelation , [id#0L, a#0, b#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName.explain
index 6ec8eb37f50ed..2877c7cef0fda 100644
--- a/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName.explain
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName.explain
@@ -1,4 +1,4 @@
-Union false, false
+'Union false, false
:- Project [id#0L, a#0]
: +- LocalRelation , [id#0L, a#0, b#0]
+- Project [id#0L, a#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName_allowMissingColumns.explain b/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName_allowMissingColumns.explain
index 96bd9f281c15e..dc0d1d94f85c1 100644
--- a/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName_allowMissingColumns.explain
+++ b/sql/connect/common/src/test/resources/query-tests/explain-results/unionByName_allowMissingColumns.explain
@@ -1,4 +1,4 @@
-Union false, false
+'Union false, false
:- Project [id#0L, a#0, b#0, null AS payload#0]
: +- LocalRelation , [id#0L, a#0, b#0]
+- Project [id#0L, a#0, null AS b#0, payload#0]
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_lit.json b/sql/connect/common/src/test/resources/query-tests/queries/function_lit.json
index 96bdfcc8105ba..cedf7572a1fd3 100644
--- a/sql/connect/common/src/test/resources/query-tests/queries/function_lit.json
+++ b/sql/connect/common/src/test/resources/query-tests/queries/function_lit.json
@@ -358,15 +358,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 8
}, {
"integer": 6
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -582,6 +585,30 @@
}
}
}
+ }, {
+ "literal": {
+ "time": {
+ "nano": "86399999999999",
+ "precision": 6
+ }
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "lit",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
}, {
"literal": {
"calendarInterval": {
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_lit.proto.bin b/sql/connect/common/src/test/resources/query-tests/queries/function_lit.proto.bin
index 8036cda6765f8..5d30f4fca159b 100644
Binary files a/sql/connect/common/src/test/resources/query-tests/queries/function_lit.proto.bin and b/sql/connect/common/src/test/resources/query-tests/queries/function_lit.proto.bin differ
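Note: the golden-file updates above and below reflect the new wire shape, where an array literal carries a `DataType.Array` (element type plus `containsNull`) rather than a bare `elementType`. A hedged sketch of building that shape directly, mirroring what `arrayBuilder` now emits; the values are illustrative.

```scala
import org.apache.spark.connect.proto

// ARRAY(8, 6) in the new shape: the type lives in data_type, not element_type.
val arrayType = proto.DataType.Array
  .newBuilder()
  .setElementType(proto.DataType.newBuilder().setInteger(proto.DataType.Integer.newBuilder()))
  .setContainsNull(true)
  .build()

val literal = proto.Expression.Literal
  .newBuilder()
  .setArray(
    proto.Expression.Literal.Array
      .newBuilder()
      .setDataType(arrayType)
      .addElements(proto.Expression.Literal.newBuilder().setInteger(8))
      .addElements(proto.Expression.Literal.newBuilder().setInteger(6)))
  .build()
```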
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.json b/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.json
index 337b3366649f7..53b1a7b3947f9 100644
--- a/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.json
+++ b/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.json
@@ -14,9 +14,12 @@
"expressions": [{
"literal": {
"array": {
- "elementType": {
- "double": {
- }
+ "dataType": {
+ "elementType": {
+ "double": {
+ }
+ },
+ "containsNull": true
}
}
},
@@ -40,46 +43,58 @@
}, {
"literal": {
"array": {
- "elementType": {
- "array": {
- "elementType": {
- "integer": {
- }
- },
- "containsNull": true
- }
- },
"elements": [{
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
}, {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 2
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
}, {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 3
- }]
- }
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
+ }
+ }],
+ "dataType": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -102,90 +117,111 @@
}, {
"literal": {
"array": {
- "elementType": {
- "array": {
- "elementType": {
- "array": {
- "elementType": {
- "integer": {
- }
- },
- "containsNull": true
- }
- },
- "containsNull": true
- }
- },
"elements": [{
"array": {
- "elementType": {
- "array": {
- "elementType": {
- "integer": {
- }
- },
- "containsNull": true
- }
- },
"elements": [{
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
+ },
+ "containsNull": true
+ }
}
}, {
"array": {
- "elementType": {
- "array": {
- "elementType": {
- "integer": {
- }
- },
- "containsNull": true
- }
- },
"elements": [{
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 2
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
+ },
+ "containsNull": true
+ }
}
}, {
"array": {
- "elementType": {
- "array": {
- "elementType": {
- "integer": {
- }
- },
- "containsNull": true
- }
- },
"elements": [{
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 3
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
- }]
- }
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
+ },
+ "containsNull": true
+ }
+ }
+ }],
+ "dataType": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
+ },
+ "containsNull": true
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -208,15 +244,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "boolean": {
- }
- },
"elements": [{
"boolean": true
}, {
"boolean": false
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "boolean": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -260,17 +299,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "short": {
- }
- },
"elements": [{
"short": 9872
}, {
"short": 9873
}, {
"short": 9874
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "short": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -293,17 +335,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": -8726532
}, {
"integer": 8726532
}, {
"integer": -8726533
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -326,17 +371,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "long": {
- }
- },
"elements": [{
"long": "7834609328726531"
}, {
"long": "7834609328726532"
}, {
"long": "7834609328726533"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "long": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -359,17 +407,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "double": {
- }
- },
"elements": [{
"double": 2.718281828459045
}, {
"double": 1.0
}, {
"double": 2.0
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "double": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -392,17 +443,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "float": {
- }
- },
"elements": [{
"float": -0.8
}, {
"float": -0.7
}, {
"float": -0.9
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "float": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -425,12 +479,6 @@
}, {
"literal": {
"array": {
- "elementType": {
- "decimal": {
- "scale": 18,
- "precision": 38
- }
- },
"elements": [{
"decimal": {
"value": "89.97620",
@@ -443,7 +491,16 @@
"precision": 7,
"scale": 5
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "decimal": {
+ "scale": 18,
+ "precision": 38
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -466,12 +523,6 @@
}, {
"literal": {
"array": {
- "elementType": {
- "decimal": {
- "scale": 18,
- "precision": 38
- }
- },
"elements": [{
"decimal": {
"value": "89889.7667231",
@@ -484,7 +535,16 @@
"precision": 12,
"scale": 7
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "decimal": {
+ "scale": 18,
+ "precision": 38
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -507,16 +567,19 @@
}, {
"literal": {
"array": {
- "elementType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
"elements": [{
"string": "connect!"
}, {
"string": "disconnect!"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -560,16 +623,19 @@
}, {
"literal": {
"array": {
- "elementType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
"elements": [{
"string": "ABCDEFGHIJ"
}, {
"string": "BCDEFGHIJK"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -592,15 +658,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "date": {
- }
- },
"elements": [{
"date": 18545
}, {
"date": 18546
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "date": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -623,15 +692,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "timestamp": {
- }
- },
"elements": [{
"timestamp": "1677155519808000"
}, {
"timestamp": "1677155519809000"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "timestamp": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -654,15 +726,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "timestamp": {
- }
- },
"elements": [{
"timestamp": "12345000"
}, {
"timestamp": "23456000"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "timestamp": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -685,15 +760,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "timestampNtz": {
- }
- },
"elements": [{
"timestampNtz": "1677184560000000"
}, {
"timestampNtz": "1677188160000000"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "timestampNtz": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -716,15 +794,18 @@
}, {
"literal": {
"array": {
- "elementType": {
- "date": {
- }
- },
"elements": [{
"date": 19411
}, {
"date": 19417
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "date": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -747,17 +828,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "dayTimeInterval": {
- "startField": 0,
- "endField": 3
- }
- },
"elements": [{
"dayTimeInterval": "100000000"
}, {
"dayTimeInterval": "200000000"
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "dayTimeInterval": {
+ "startField": 0,
+ "endField": 3
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -780,17 +864,20 @@
}, {
"literal": {
"array": {
- "elementType": {
- "yearMonthInterval": {
- "startField": 0,
- "endField": 1
- }
- },
"elements": [{
"yearMonthInterval": 0
}, {
"yearMonthInterval": 0
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "yearMonthInterval": {
+ "startField": 0,
+ "endField": 1
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -813,10 +900,6 @@
}, {
"literal": {
"array": {
- "elementType": {
- "calendarInterval": {
- }
- },
"elements": [{
"calendarInterval": {
"months": 2,
@@ -829,7 +912,14 @@
"days": 21,
"microseconds": "200"
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "calendarInterval": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.proto.bin b/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.proto.bin
index 320da10258180..8cb965dd25a0b 100644
Binary files a/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.proto.bin and b/sql/connect/common/src/test/resources/query-tests/queries/function_lit_array.proto.bin differ
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date.json b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date.json
new file mode 100644
index 0000000000000..fa22071a05e5e
--- /dev/null
+++ b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date.json
@@ -0,0 +1,60 @@
+{
+ "common": {
+ "planId": "1"
+ },
+ "project": {
+ "input": {
+ "common": {
+ "planId": "0"
+ },
+ "localRelation": {
+ "schema": "struct\u003cd:date,t:timestamp,s:string,x:bigint,wt:struct\u003cstart:timestamp,end:timestamp\u003e\u003e"
+ }
+ },
+ "expressions": [{
+ "unresolvedFunction": {
+ "functionName": "try_to_date",
+ "arguments": [{
+ "unresolvedAttribute": {
+ "unparsedIdentifier": "s"
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "col",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
+ }],
+ "isInternal": false
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "try_to_date",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
+ }]
+ }
+}
\ No newline at end of file
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date.proto.bin b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date.proto.bin
new file mode 100644
index 0000000000000..d322dec35417a
Binary files /dev/null and b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date.proto.bin differ
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date_with_format.json b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date_with_format.json
new file mode 100644
index 0000000000000..ccf5e8970ce9f
--- /dev/null
+++ b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date_with_format.json
@@ -0,0 +1,81 @@
+{
+ "common": {
+ "planId": "1"
+ },
+ "project": {
+ "input": {
+ "common": {
+ "planId": "0"
+ },
+ "localRelation": {
+ "schema": "struct\u003cd:date,t:timestamp,s:string,x:bigint,wt:struct\u003cstart:timestamp,end:timestamp\u003e\u003e"
+ }
+ },
+ "expressions": [{
+ "unresolvedFunction": {
+ "functionName": "try_to_date",
+ "arguments": [{
+ "unresolvedAttribute": {
+ "unparsedIdentifier": "s"
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "col",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
+ }, {
+ "literal": {
+ "string": "yyyy-MM-dd"
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "try_to_date",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
+ }],
+ "isInternal": false
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "try_to_date",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
+ }]
+ }
+}
\ No newline at end of file
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date_with_format.proto.bin b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date_with_format.proto.bin
new file mode 100644
index 0000000000000..0c252b8c37a93
Binary files /dev/null and b/sql/connect/common/src/test/resources/query-tests/queries/function_try_to_date_with_format.proto.bin differ
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.json b/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.json
index e56b6e1f3ee09..66bf31d670f9f 100644
--- a/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.json
+++ b/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.json
@@ -403,15 +403,17 @@
}, {
"literal": {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 8
}, {
"integer": 6
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
},
"common": {
@@ -627,6 +629,30 @@
}
}
}
+ }, {
+ "literal": {
+ "time": {
+ "nano": "86399999999999",
+ "precision": 6
+ }
+ },
+ "common": {
+ "origin": {
+ "jvmOrigin": {
+ "stackTrace": [{
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.functions$",
+ "methodName": "typedLit",
+ "fileName": "functions.scala"
+ }, {
+ "classLoaderName": "app",
+ "declaringClass": "org.apache.spark.sql.PlanGenerationTestSuite",
+ "methodName": "~~trimmed~anonfun~~",
+ "fileName": "PlanGenerationTestSuite.scala"
+ }]
+ }
+ }
+ }
}, {
"literal": {
"calendarInterval": {
@@ -676,17 +702,19 @@
}, {
"literal": {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
}, {
"integer": 2
}, {
"integer": 3
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
},
"common": {
@@ -709,17 +737,19 @@
}, {
"literal": {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
}, {
"integer": 2
}, {
"integer": 3
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
},
"common": {
@@ -742,15 +772,6 @@
}, {
"literal": {
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -760,7 +781,18 @@
"integer": 1
}, {
"integer": 2
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
},
"common": {
@@ -783,38 +815,28 @@
}, {
"literal": {
"struct": {
- "structType": {
- "struct": {
- "fields": [{
- "name": "_1",
- "dataType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "nullable": true
- }, {
- "name": "_2",
- "dataType": {
- "integer": {
- }
- }
- }, {
- "name": "_3",
- "dataType": {
- "double": {
- }
- }
- }]
- }
- },
"elements": [{
"string": "a"
}, {
"integer": 2
}, {
"double": 1.0
- }]
+ }],
+ "dataTypeStruct": {
+ "fields": [{
+ "name": "_1",
+ "dataType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "nullable": true
+ }, {
+ "name": "_2"
+ }, {
+ "name": "_3"
+ }]
+ }
}
},
"common": {
@@ -861,13 +883,16 @@
}, {
"literal": {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -890,14 +915,6 @@
}, {
"literal": {
"map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"integer": 1
}],
@@ -906,7 +923,18 @@
"integer": {
}
}
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "integer": {
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ },
+ "valueContainsNull": true
+ }
}
},
"common": {
@@ -929,14 +957,6 @@
}, {
"literal": {
"map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"integer": 1
}],
@@ -945,7 +965,18 @@
"integer": {
}
}
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "integer": {
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ },
+ "valueContainsNull": true
+ }
}
},
"common": {
@@ -968,14 +999,6 @@
}, {
"literal": {
"map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"integer": 1
}],
@@ -984,7 +1007,18 @@
"integer": {
}
}
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "integer": {
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ },
+ "valueContainsNull": true
+ }
}
},
"common": {
@@ -1007,57 +1041,66 @@
}, {
"literal": {
"array": {
- "elementType": {
- "array": {
- "elementType": {
- "integer": {
- }
- }
- }
- },
"elements": [{
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
}, {
"integer": 2
}, {
"integer": 3
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 4
}, {
"integer": 5
}, {
"integer": 6
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 7
}, {
"integer": 8
}, {
"integer": 9
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "array": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -1080,30 +1123,8 @@
}, {
"literal": {
"array": {
- "elementType": {
- "map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- }
- }
- },
"elements": [{
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -1113,19 +1134,21 @@
"integer": 1
}, {
"integer": 2
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -1135,19 +1158,21 @@
"integer": 3
}, {
"integer": 4
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -1157,9 +1182,36 @@
"integer": 5
}, {
"integer": 6
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "map": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
+ },
+ "containsNull": true
+ }
}
},
"common": {
@@ -1182,23 +1234,6 @@
}, {
"literal": {
"map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- }
- }
- },
"keys": [{
"integer": 1
}, {
@@ -1206,15 +1241,6 @@
}],
"values": [{
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -1224,19 +1250,21 @@
"integer": 1
}, {
"integer": 2
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -1246,9 +1274,40 @@
"integer": 3
}, {
"integer": 4
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "integer": {
+ }
+ },
+ "valueType": {
+ "map": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
+ },
+ "valueContainsNull": true
+ }
}
},
"common": {
@@ -1271,96 +1330,24 @@
}, {
"literal": {
"struct": {
- "structType": {
- "struct": {
- "fields": [{
- "name": "_1",
- "dataType": {
- "array": {
- "elementType": {
- "integer": {
- }
- }
- }
- },
- "nullable": true
- }, {
- "name": "_2",
- "dataType": {
- "map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- }
- }
- },
- "nullable": true
- }, {
- "name": "_3",
- "dataType": {
- "struct": {
- "fields": [{
- "name": "_1",
- "dataType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "nullable": true
- }, {
- "name": "_2",
- "dataType": {
- "map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueContainsNull": true
- }
- },
- "nullable": true
- }]
- }
- },
- "nullable": true
- }]
- }
- },
"elements": [{
"array": {
- "elementType": {
- "integer": {
- }
- },
"elements": [{
"integer": 1
}, {
"integer": 2
}, {
"integer": 3
- }]
+ }],
+ "dataType": {
+ "elementType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"map": {
- "keyType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueType": {
- "integer": {
- }
- },
"keys": [{
"string": "a"
}, {
@@ -1370,53 +1357,25 @@
"integer": 1
}, {
"integer": 2
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueType": {
+ "integer": {
+ }
+ }
+ }
}
}, {
"struct": {
- "structType": {
- "struct": {
- "fields": [{
- "name": "_1",
- "dataType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "nullable": true
- }, {
- "name": "_2",
- "dataType": {
- "map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
- "valueContainsNull": true
- }
- },
- "nullable": true
- }]
- }
- },
"elements": [{
"string": "a"
}, {
"map": {
- "keyType": {
- "integer": {
- }
- },
- "valueType": {
- "string": {
- "collation": "UTF8_BINARY"
- }
- },
"keys": [{
"integer": 1
}, {
@@ -1426,11 +1385,49 @@
"string": "a"
}, {
"string": "b"
- }]
+ }],
+ "dataType": {
+ "keyType": {
+ "integer": {
+ }
+ },
+ "valueType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "valueContainsNull": true
+ }
}
- }]
+ }],
+ "dataTypeStruct": {
+ "fields": [{
+ "name": "_1",
+ "dataType": {
+ "string": {
+ "collation": "UTF8_BINARY"
+ }
+ },
+ "nullable": true
+ }, {
+ "name": "_2",
+ "nullable": true
+ }]
+ }
}
- }]
+ }],
+ "dataTypeStruct": {
+ "fields": [{
+ "name": "_1",
+ "nullable": true
+ }, {
+ "name": "_2",
+ "nullable": true
+ }, {
+ "name": "_3",
+ "nullable": true
+ }]
+ }
}
},
"common": {
diff --git a/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.proto.bin b/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.proto.bin
index 38a6ce6300567..b3ebe8a79e3ec 100644
Binary files a/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.proto.bin and b/sql/connect/common/src/test/resources/query-tests/queries/function_typedLit.proto.bin differ
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/config/Connect.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/config/Connect.scala
index 5fe62295d1a5a..1887e4ede04db 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/config/Connect.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/config/Connect.scala
@@ -304,7 +304,7 @@ object Connect {
.version("4.0.0")
.internal()
.intConf
- .createWithDefault(16)
+ .createWithDefault(32)
val CONNECT_SESSION_PLAN_CACHE_ENABLED =
buildConf("spark.connect.session.planCache.enabled")
@@ -317,6 +317,17 @@ object Connect {
.booleanConf
.createWithDefault(true)
+ val CONNECT_ALWAYS_CACHE_DATA_SOURCE_READS_ENABLED =
+ buildConf("spark.connect.session.planCache.alwaysCacheDataSourceReadsEnabled")
+ .doc("When true, always cache the translation of Read.DataSource plans" +
+ " in the plan cache. This massively improves the performance of queries that reuse the" +
+ " same Read.DataSource within the same session, since these translations/analyses" +
+ " are usually quite costly.")
+ .version("4.1.0")
+ .internal()
+ .booleanConf
+ .createWithDefault(true)
+
val CONNECT_AUTHENTICATE_TOKEN =
buildStaticConf("spark.connect.authenticate.token")
.doc("A pre-shared token that will be used to authenticate clients. This secret must be" +
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteGrpcResponseSender.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteGrpcResponseSender.scala
index ff59789980ce7..632a2aecee050 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteGrpcResponseSender.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteGrpcResponseSender.scala
@@ -24,7 +24,7 @@ import io.grpc.stub.{ServerCallStreamObserver, StreamObserver}
import org.apache.spark.{SparkEnv, SparkSQLException}
import org.apache.spark.connect.proto.ExecutePlanResponse
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.catalyst.util.DateTimeConstants.NANOS_PER_MILLIS
import org.apache.spark.sql.connect.common.ProtoUtils
@@ -232,7 +232,8 @@ private[connect] class ExecuteGrpcResponseSender[T <: Message](
// 2. has a response to send
def gotResponse = response.nonEmpty
// 3. sent everything from the stream and the stream is finished
- def streamFinished = executionObserver.getLastResponseIndex().exists(nextIndex > _)
+ def streamFinished = executionObserver.getLastResponseIndex().exists(nextIndex > _) ||
+ executionObserver.isCleaned()
// 4. time deadline or size limit reached
def deadlineLimitReached =
sentResponsesSize > maximumResponseSize || deadlineTimeNs < System.nanoTime()
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteResponseObserver.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteResponseObserver.scala
index 9d0cc2128dd41..2473df0e53f1e 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteResponseObserver.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteResponseObserver.scala
@@ -26,7 +26,7 @@ import io.grpc.stub.StreamObserver
import org.apache.spark.{SparkEnv, SparkSQLException}
import org.apache.spark.connect.proto
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.connect.config.Connect.CONNECT_EXECUTE_REATTACHABLE_OBSERVER_RETRY_BUFFER_SIZE
import org.apache.spark.sql.connect.service.ExecuteHolder
@@ -260,6 +260,11 @@ private[connect] class ExecuteResponseObserver[T <: Message](val executeHolder:
finalProducedIndex.isDefined
}
+ // Returns true if this observer has already been cleaned up.
+ def isCleaned(): Boolean = responseLock.synchronized {
+ completed() && responses.isEmpty
+ }
+
// For testing.
private[connect] def undoCompletion(): Unit = responseLock.synchronized {
finalProducedIndex = None
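Putting the two changes above together: the gRPC sender's `streamFinished` condition now also fires when the observer has already been cleaned up (completed with no buffered responses), so the sender cannot wait forever on a drained observer. A self-contained sketch of that condition, assuming an observer view with the same two accessors:

```scala
// Stand-in for the real ExecuteResponseObserver surface.
trait ObserverView {
  def getLastResponseIndex(): Option[Long]
  def isCleaned(): Boolean
}

object SenderConditionSketch {
  // Finished when everything up to the final index was sent, or when the observer
  // was already cleaned (completed and its response buffer emptied).
  def streamFinished(observer: ObserverView, nextIndex: Long): Boolean =
    observer.getLastResponseIndex().exists(nextIndex > _) || observer.isCleaned()
}
```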
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteThreadRunner.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteThreadRunner.scala
index 13857e066a8fa..7c4ad7df66fc8 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteThreadRunner.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/ExecuteThreadRunner.scala
@@ -23,13 +23,12 @@ import scala.jdk.CollectionConverters._
import scala.util.control.NonFatal
import com.google.protobuf.Message
-import org.apache.commons.lang3.StringUtils
import org.apache.spark.SparkSQLException
import org.apache.spark.connect.proto
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.connect.common.ProtoUtils
-import org.apache.spark.sql.connect.planner.SparkConnectPlanner
+import org.apache.spark.sql.connect.planner.InvalidInputErrors
import org.apache.spark.sql.connect.service.{ExecuteHolder, ExecuteSessionTag, SparkConnectService}
import org.apache.spark.sql.connect.utils.ErrorUtils
import org.apache.spark.util.Utils
@@ -209,23 +208,23 @@ private[connect] class ExecuteThreadRunner(executeHolder: ExecuteHolder) extends
tag))
}
session.sparkContext.setJobDescription(
- s"Spark Connect - ${StringUtils.abbreviate(debugString, 128)}")
+ s"Spark Connect - ${Utils.abbreviate(debugString, 128)}")
session.sparkContext.setInterruptOnCancel(true)
// Add debug information to the query execution so that the jobs are traceable.
session.sparkContext.setLocalProperty(
"callSite.short",
- s"Spark Connect - ${StringUtils.abbreviate(debugString, 128)}")
- session.sparkContext.setLocalProperty(
- "callSite.long",
- StringUtils.abbreviate(debugString, 2048))
+ s"Spark Connect - ${Utils.abbreviate(debugString, 128)}")
+ session.sparkContext.setLocalProperty("callSite.long", Utils.abbreviate(debugString, 2048))
executeHolder.request.getPlan.getOpTypeCase match {
- case proto.Plan.OpTypeCase.COMMAND => handleCommand(executeHolder.request)
- case proto.Plan.OpTypeCase.ROOT => handlePlan(executeHolder.request)
- case _ =>
- throw new UnsupportedOperationException(
- s"${executeHolder.request.getPlan.getOpTypeCase} not supported.")
+ case proto.Plan.OpTypeCase.ROOT | proto.Plan.OpTypeCase.COMMAND =>
+ val execution = new SparkConnectPlanExecution(executeHolder)
+ execution.handlePlan(executeHolder.responseObserver)
+ case other =>
+ throw InvalidInputErrors.invalidOneOfField(
+ other,
+ executeHolder.request.getPlan.getDescriptorForType)
}
val observedMetrics: Map[String, Seq[(Option[String], Any)]] = {
@@ -307,21 +306,6 @@ private[connect] class ExecuteThreadRunner(executeHolder: ExecuteHolder) extends
proto.StreamingQueryListenerBusCommand.CommandCase.ADD_LISTENER_BUS_LISTENER
}
- private def handlePlan(request: proto.ExecutePlanRequest): Unit = {
- val responseObserver = executeHolder.responseObserver
-
- val execution = new SparkConnectPlanExecution(executeHolder)
- execution.handlePlan(responseObserver)
- }
-
- private def handleCommand(request: proto.ExecutePlanRequest): Unit = {
- val responseObserver = executeHolder.responseObserver
-
- val command = request.getPlan.getCommand
- val planner = new SparkConnectPlanner(executeHolder)
- planner.process(command = command, responseObserver = responseObserver)
- }
-
private def requestString(request: Message) = {
try {
Utils.redact(
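The runner now abbreviates the debug string with `org.apache.spark.util.Utils.abbreviate` instead of commons-lang3. As a hedged sketch only (the real implementation lives in `Utils`), the behavior the call sites rely on is the usual "truncate and append an ellipsis":

```scala
// Assumed behavior, mirroring what StringUtils.abbreviate provided.
def abbreviateSketch(s: String, maxLength: Int): String = {
  require(maxLength > 3, "maxLength must leave room for the ellipsis")
  if (s.length <= maxLength) s else s.take(maxLength - 3) + "..."
}
```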
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/SparkConnectPlanExecution.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/SparkConnectPlanExecution.scala
index 65b9863ca9543..388fd6a575db8 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/SparkConnectPlanExecution.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/execution/SparkConnectPlanExecution.scala
@@ -32,10 +32,10 @@ import org.apache.spark.sql.classic.{DataFrame, Dataset}
import org.apache.spark.sql.connect.common.DataTypeProtoConverter
import org.apache.spark.sql.connect.common.LiteralValueProtoConverter.toLiteralProto
import org.apache.spark.sql.connect.config.Connect.CONNECT_GRPC_ARROW_MAX_BATCH_SIZE
-import org.apache.spark.sql.connect.planner.SparkConnectPlanner
+import org.apache.spark.sql.connect.planner.{InvalidInputErrors, SparkConnectPlanner}
import org.apache.spark.sql.connect.service.ExecuteHolder
import org.apache.spark.sql.connect.utils.MetricGenerator
-import org.apache.spark.sql.execution.{DoNotCleanup, LocalTableScanExec, RemoveShuffleFiles, SkipMigration, SQLExecution}
+import org.apache.spark.sql.execution.{DoNotCleanup, LocalTableScanExec, QueryExecution, RemoveShuffleFiles, SkipMigration, SQLExecution}
import org.apache.spark.sql.execution.arrow.ArrowConverters
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.StructType
@@ -53,34 +53,49 @@ private[execution] class SparkConnectPlanExecution(executeHolder: ExecuteHolder)
def handlePlan(responseObserver: ExecuteResponseObserver[proto.ExecutePlanResponse]): Unit = {
val request = executeHolder.request
- if (request.getPlan.getOpTypeCase != proto.Plan.OpTypeCase.ROOT) {
- throw new IllegalStateException(
- s"Illegal operation type ${request.getPlan.getOpTypeCase} to be handled here.")
- }
val planner = new SparkConnectPlanner(executeHolder)
val tracker = executeHolder.eventsManager.createQueryPlanningTracker()
val conf = session.sessionState.conf
val shuffleCleanupMode =
- if (conf.getConf(SQLConf.SHUFFLE_DEPENDENCY_FILE_CLEANUP_ENABLED)) {
+ if (conf.getConf(SQLConf.CONNECT_SHUFFLE_DEPENDENCY_FILE_CLEANUP_ENABLED)) {
RemoveShuffleFiles
} else if (conf.getConf(SQLConf.SHUFFLE_DEPENDENCY_SKIP_MIGRATION_ENABLED)) {
SkipMigration
} else {
DoNotCleanup
}
- val dataframe =
- Dataset.ofRows(
- sessionHolder.session,
- planner.transformRelation(request.getPlan.getRoot, cachePlan = true),
- tracker,
- shuffleCleanupMode)
- responseObserver.onNext(createSchemaResponse(request.getSessionId, dataframe.schema))
- processAsArrowBatches(dataframe, responseObserver, executeHolder)
- responseObserver.onNext(MetricGenerator.createMetricsResponse(sessionHolder, dataframe))
- createObservedMetricsResponse(
- request.getSessionId,
- executeHolder.allObservationAndPlanIds,
- dataframe).foreach(responseObserver.onNext)
+ request.getPlan.getOpTypeCase match {
+ case proto.Plan.OpTypeCase.ROOT =>
+ val dataframe =
+ Dataset.ofRows(
+ sessionHolder.session,
+ planner.transformRelation(request.getPlan.getRoot, cachePlan = true),
+ tracker,
+ shuffleCleanupMode)
+ responseObserver.onNext(createSchemaResponse(request.getSessionId, dataframe.schema))
+ processAsArrowBatches(dataframe, responseObserver, executeHolder)
+ responseObserver.onNext(MetricGenerator.createMetricsResponse(sessionHolder, dataframe))
+ createObservedMetricsResponse(
+ request.getSessionId,
+ executeHolder.allObservationAndPlanIds,
+ dataframe).foreach(responseObserver.onNext)
+ case proto.Plan.OpTypeCase.COMMAND =>
+ val command = request.getPlan.getCommand
+ planner.transformCommand(command) match {
+ case Some(transformer) =>
+ val qe = new QueryExecution(
+ session,
+ transformer(tracker),
+ tracker,
+ shuffleCleanupMode = shuffleCleanupMode)
+ qe.assertCommandExecuted()
+ executeHolder.eventsManager.postFinished()
+ case None =>
+ planner.process(command, responseObserver)
+ }
+ case other =>
+ throw InvalidInputErrors.invalidOneOfField(other, request.getPlan.getDescriptorForType)
+ }
}
type Batch = (Array[Byte], Long)
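A self-contained sketch (illustrative names only) of the new dispatch in `handlePlan`: ROOT plans keep the DataFrame/Arrow path, commands whose translation is known up front are executed directly as a command plan, and everything else falls back to the legacy handler.

```scala
sealed trait PlanOpSketch
case object RootOp extends PlanOpSketch
final case class CommandOp(payload: String) extends PlanOpSketch

object PlanDispatchSketch {
  def handle(
      op: PlanOpSketch,
      transformCommand: String => Option[() => String],
      runRootQuery: () => Unit,
      fallbackProcess: String => Unit): Unit = op match {
    case RootOp =>
      runRootQuery() // build the DataFrame, stream schema, Arrow batches and metrics
    case CommandOp(payload) =>
      transformCommand(payload) match {
        case Some(translate) =>
          val plan = translate() // executed eagerly, mirroring qe.assertCommandExecuted()
          println(s"executed command plan: $plan")
        case None =>
          fallbackProcess(payload) // commands without a direct translation keep the old path
      }
  }
}
```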
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLCache.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLCache.scala
index ef1b17dc2221e..7761c0078b27c 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLCache.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLCache.scala
@@ -25,14 +25,14 @@ import java.util.concurrent.atomic.AtomicLong
import scala.collection.mutable
import com.google.common.cache.{CacheBuilder, RemovalNotification}
-import org.apache.commons.io.FileUtils
import org.apache.spark.SparkException
import org.apache.spark.internal.Logging
import org.apache.spark.ml.Model
-import org.apache.spark.ml.util.{ConnectHelper, MLWritable, Summary}
+import org.apache.spark.ml.util.{ConnectHelper, HasTrainingSummary, MLWritable, Summary}
import org.apache.spark.sql.connect.config.Connect
import org.apache.spark.sql.connect.service.SessionHolder
+import org.apache.spark.util.SparkFileUtils
/**
* MLCache is for caching ML objects, typically for models and summaries evaluated by a model.
@@ -115,6 +115,12 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
}
}
+ private[spark] def getModelOffloadingPath(refId: String): Path = {
+ val path = offloadedModelsDir.resolve(refId)
+ require(path.startsWith(offloadedModelsDir))
+ path
+ }
+
/**
* Cache an object into a map of MLCache, and return its key
* @param obj
@@ -122,7 +128,7 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
* @return
* the key
*/
- def register(obj: Object): String = {
+ def register(obj: Object): String = this.synchronized {
val objectId = UUID.randomUUID().toString
if (obj.isInstanceOf[Summary]) {
@@ -137,9 +143,14 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
}
cachedModel.put(objectId, CacheItem(obj, sizeBytes))
if (getMemoryControlEnabled) {
- val savePath = offloadedModelsDir.resolve(objectId)
- require(savePath.startsWith(offloadedModelsDir))
+ val savePath = getModelOffloadingPath(objectId)
obj.asInstanceOf[MLWritable].write.saveToLocal(savePath.toString)
+ if (obj.isInstanceOf[HasTrainingSummary[_]]
+ && obj.asInstanceOf[HasTrainingSummary[_]].hasSummary) {
+ obj
+ .asInstanceOf[HasTrainingSummary[_]]
+ .saveSummary(savePath.resolve("summary").toString)
+ }
Files.writeString(savePath.resolve(modelClassNameFile), obj.getClass.getName)
totalMLCacheInMemorySizeBytes.addAndGet(sizeBytes)
totalMLCacheSizeBytes.addAndGet(sizeBytes)
@@ -169,15 +180,14 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
* @return
* the cached object
*/
- def get(refId: String): Object = {
+ def get(refId: String): Object = this.synchronized {
if (refId == helperID) {
helper
} else {
verifyObjectId(refId)
var obj: Object = Option(cachedModel.get(refId)).map(_.obj).getOrElse(null)
if (obj == null && getMemoryControlEnabled) {
- val loadPath = offloadedModelsDir.resolve(refId)
- require(loadPath.startsWith(offloadedModelsDir))
+ val loadPath = getModelOffloadingPath(refId)
if (Files.isDirectory(loadPath)) {
val className = Files.readString(loadPath.resolve(modelClassNameFile))
obj = MLUtils.loadTransformer(
@@ -194,17 +204,16 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
}
}
- def _removeModel(refId: String): Boolean = {
+ def _removeModel(refId: String, evictOnly: Boolean): Boolean = {
verifyObjectId(refId)
val removedModel = cachedModel.remove(refId)
val removedFromMem = removedModel != null
- val removedFromDisk = if (removedModel != null && getMemoryControlEnabled) {
+ val removedFromDisk = if (!evictOnly && removedModel != null && getMemoryControlEnabled) {
totalMLCacheSizeBytes.addAndGet(-removedModel.sizeBytes)
- val removePath = offloadedModelsDir.resolve(refId)
- require(removePath.startsWith(offloadedModelsDir))
+ val removePath = getModelOffloadingPath(refId)
val offloadingPath = new File(removePath.toString)
if (offloadingPath.exists()) {
- FileUtils.deleteDirectory(offloadingPath)
+ SparkFileUtils.deleteRecursively(offloadingPath)
true
} else {
false
@@ -220,8 +229,8 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
* @param refId
* the key used to look up the corresponding object
*/
- def remove(refId: String): Boolean = {
- val modelIsRemoved = _removeModel(refId)
+ def remove(refId: String, evictOnly: Boolean = false): Boolean = this.synchronized {
+ val modelIsRemoved = _removeModel(refId, evictOnly)
modelIsRemoved
}
@@ -229,16 +238,17 @@ private[connect] class MLCache(sessionHolder: SessionHolder) extends Logging {
/**
* Clear all the caches
*/
- def clear(): Int = {
+ def clear(): Int = this.synchronized {
val size = cachedModel.size()
cachedModel.clear()
+ totalMLCacheSizeBytes.set(0)
if (getMemoryControlEnabled) {
- FileUtils.cleanDirectory(new File(offloadedModelsDir.toString))
+ SparkFileUtils.cleanDirectory(new File(offloadedModelsDir.toString))
}
size
}
- def getInfo(): Array[String] = {
+ def getInfo(): Array[String] = this.synchronized {
val info = mutable.ArrayBuilder.make[String]
cachedModel.forEach { case (key, value) =>
info += s"id: $key, obj: ${value.obj.getClass}, size: ${value.sizeBytes}"
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLException.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLException.scala
index a017c719ed16e..847052be98a98 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLException.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLException.scala
@@ -51,3 +51,9 @@ private[spark] case class MLCacheSizeOverflowException(mlCacheMaxSize: Long)
errorClass = "CONNECT_ML.ML_CACHE_SIZE_OVERFLOW_EXCEPTION",
messageParameters = Map("mlCacheMaxSize" -> mlCacheMaxSize.toString),
cause = null)
+
+private[spark] case class MLModelSummaryLostException(objectName: String)
+ extends SparkException(
+ errorClass = "CONNECT_ML.MODEL_SUMMARY_LOST",
+ messageParameters = Map("objectName" -> objectName),
+ cause = null)
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLHandler.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLHandler.scala
index d40b70ba0813c..40f1172677a50 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLHandler.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLHandler.scala
@@ -17,11 +17,14 @@
package org.apache.spark.sql.connect.ml
+import java.io.{PrintWriter, StringWriter}
import java.lang.ThreadLocal
+import java.util.concurrent.ConcurrentHashMap
import scala.collection.mutable
import scala.jdk.CollectionConverters.CollectionHasAsScala
+import org.apache.spark.SparkException
import org.apache.spark.connect.proto
import org.apache.spark.internal.Logging
import org.apache.spark.ml.{Estimator, EstimatorUtils, Model, Transformer}
@@ -121,6 +124,9 @@ private[connect] object MLHandler extends Logging {
override def initialValue: SessionHolder = null
}
+ // A map of thread id -> handler execution start time (epoch milliseconds)
+ val handlerExecutionStartTimeMap = new ConcurrentHashMap[Long, Long]()
+
private val allowlistedMLClasses = {
val transformerClasses = MLUtils.loadOperators(classOf[Transformer])
val estimatorClasses = MLUtils.loadOperators(classOf[Estimator[_]])
@@ -150,7 +156,43 @@ private[connect] object MLHandler extends Logging {
}
}
- def handleMlCommand(
+ def startHangingHandlerReaper(): Unit = {
+ val handlerInterruptionTimeoutMinutes = {
+ try {
+ val envValue = System.getenv("SPARK_CONNECT_ML_HANDLER_INTERRUPTION_TIMEOUT_MINUTES")
+ if (envValue != null) {
+ envValue.toInt
+ } else { 0 }
+ } catch {
+ case _: Exception => 0
+ }
+ }
+
+ if (handlerInterruptionTimeoutMinutes > 0) {
+ val handlerInterruptionTimeoutMillis = handlerInterruptionTimeoutMinutes * 60 * 1000
+ val thread = new Thread(() => {
+ while (true) {
+ handlerExecutionStartTimeMap.forEach { (threadId, startTime) =>
+ val execTime = System.currentTimeMillis() - startTime
+ if (execTime > handlerInterruptionTimeoutMillis) {
+ for (t <- Thread.getAllStackTraces().keySet().asScala) {
+ if (t.getId() == threadId) {
+ t.interrupt()
+ }
+ }
+ }
+ }
+ Thread.sleep(60 * 1000)
+ }
+ })
+ thread.setDaemon(true)
+ thread.start()
+ }
+ }
+
+ startHangingHandlerReaper()
+
+ def _handleMlCommand(
sessionHolder: SessionHolder,
mlCommand: proto.MlCommand): proto.MlCommandResult = {
@@ -229,9 +271,7 @@ private[connect] object MLHandler extends Logging {
if (obj != null && obj.isInstanceOf[HasTrainingSummary[_]]
&& methods(0).getMethod == "summary"
&& !obj.asInstanceOf[HasTrainingSummary[_]].hasSummary) {
- throw MLCacheInvalidException(
- objRefId,
- sessionHolder.mlCache.getOffloadingTimeoutMinute)
+ throw MLModelSummaryLostException(objRefId)
}
val helper = AttributeHelper(sessionHolder, objRefId, methods)
val attrResult = helper.getAttribute
@@ -264,9 +304,13 @@ private[connect] object MLHandler extends Logging {
case proto.MlCommand.CommandCase.DELETE =>
val ids = mutable.ArrayBuilder.make[String]
- mlCommand.getDelete.getObjRefsList.asScala.toArray.foreach { objId =>
+ val deleteCmd = mlCommand.getDelete
+ val evictOnly = if (deleteCmd.hasEvictOnly) {
+ deleteCmd.getEvictOnly
+ } else { false }
+ deleteCmd.getObjRefsList.asScala.toArray.foreach { objId =>
if (!objId.getId.contains(".")) {
- if (mlCache.remove(objId.getId)) {
+ if (mlCache.remove(objId.getId, evictOnly)) {
ids += objId.getId
}
}
@@ -400,11 +444,80 @@ private[connect] object MLHandler extends Logging {
.setParam(LiteralValueProtoConverter.toLiteralProto(metric))
.build()
+ case proto.MlCommand.CommandCase.CREATE_SUMMARY =>
+ val createSummaryCmd = mlCommand.getCreateSummary
+ createModelSummary(sessionHolder, createSummaryCmd)
+
+ case proto.MlCommand.CommandCase.GET_MODEL_SIZE =>
+ val modelRefId = mlCommand.getGetModelSize.getModelRef.getId
+ val model = mlCache.get(modelRefId)
+ val modelSize = model.asInstanceOf[Model[_]].estimatedSize
+ proto.MlCommandResult
+ .newBuilder()
+ .setParam(LiteralValueProtoConverter.toLiteralProto(modelSize))
+ .build()
+
case other => throw MlUnsupportedException(s"$other not supported")
}
}
- def transformMLRelation(relation: proto.MlRelation, sessionHolder: SessionHolder): DataFrame = {
+ def wrapHandler(
+ originHandler: () => Any,
+ reqProto: com.google.protobuf.GeneratedMessage): Any = {
+ val threadId = Thread.currentThread().getId
+ val startTime = System.currentTimeMillis()
+ handlerExecutionStartTimeMap.put(threadId, startTime)
+ try {
+ originHandler()
+ } catch {
+ case e: InterruptedException =>
+ val stackTrace = {
+ val sw = new StringWriter()
+ val pw = new PrintWriter(sw)
+ e.printStackTrace(pw)
+ sw.toString
+ }
+ val execTime = (System.currentTimeMillis() - startTime) / (60 * 1000)
+ throw SparkException.internalError(
+ s"The Spark Connect ML handler thread is interrupted after executing for " +
+ s"$execTime minutes.\nThe request proto message is:\n${reqProto.toString}\n, " +
+ s"the current stack trace is:\n$stackTrace\n")
+ } finally {
+ handlerExecutionStartTimeMap.remove(threadId)
+ }
+ }
+
+ def handleMlCommand(
+ sessionHolder: SessionHolder,
+ mlCommand: proto.MlCommand): proto.MlCommandResult = {
+ wrapHandler(() => _handleMlCommand(sessionHolder, mlCommand), mlCommand)
+ .asInstanceOf[proto.MlCommandResult]
+ }
+
+ private def createModelSummary(
+ sessionHolder: SessionHolder,
+ createSummaryCmd: proto.MlCommand.CreateSummary): proto.MlCommandResult =
+ sessionHolder.mlCache.synchronized {
+ val refId = createSummaryCmd.getModelRef.getId
+ val model = sessionHolder.mlCache.get(refId).asInstanceOf[HasTrainingSummary[_]]
+ val isCreated = if (!model.hasSummary) {
+ val dataset = MLUtils.parseRelationProto(createSummaryCmd.getDataset, sessionHolder)
+ val modelPath = sessionHolder.mlCache.getModelOffloadingPath(refId)
+ val summaryPath = modelPath.resolve("summary").toString
+ model.loadSummary(summaryPath, dataset)
+ true
+ } else {
+ false
+ }
+ proto.MlCommandResult
+ .newBuilder()
+ .setParam(LiteralValueProtoConverter.toLiteralProto(isCreated))
+ .build()
+ }
+
+ def _transformMLRelation(
+ relation: proto.MlRelation,
+ sessionHolder: SessionHolder): DataFrame = {
relation.getMlTypeCase match {
// Ml transform
case proto.MlRelation.MlTypeCase.TRANSFORM =>
@@ -433,13 +546,36 @@ private[connect] object MLHandler extends Logging {
// Get the attribute from a cached object which could be a model or summary
case proto.MlRelation.MlTypeCase.FETCH =>
- val helper = AttributeHelper(
- sessionHolder,
- relation.getFetch.getObjRef.getId,
- relation.getFetch.getMethodsList.asScala.toArray)
+ val objRefId = relation.getFetch.getObjRef.getId
+ val methods = relation.getFetch.getMethodsList.asScala.toArray
+ val obj = sessionHolder.mlCache.get(objRefId)
+ sessionHolder.mlCache.synchronized {
+ if (obj != null && obj.isInstanceOf[HasTrainingSummary[_]]
+ && methods(0).getMethod == "summary"
+ && !obj.asInstanceOf[HasTrainingSummary[_]].hasSummary) {
+
+ if (relation.hasModelSummaryDataset) {
+ val dataset =
+ MLUtils.parseRelationProto(relation.getModelSummaryDataset, sessionHolder)
+ val modelPath = sessionHolder.mlCache.getModelOffloadingPath(objRefId)
+ val summaryPath = modelPath.resolve("summary").toString
+ obj.asInstanceOf[HasTrainingSummary[_]].loadSummary(summaryPath, dataset)
+ } else {
+ // For old Spark client backward compatibility.
+ throw MLModelSummaryLostException(objRefId)
+ }
+ }
+ }
+
+ val helper = AttributeHelper(sessionHolder, objRefId, methods)
helper.getAttribute.asInstanceOf[DataFrame]
case other => throw MlUnsupportedException(s"$other not supported")
}
}
+
+ def transformMLRelation(relation: proto.MlRelation, sessionHolder: SessionHolder): DataFrame = {
+ wrapHandler(() => _transformMLRelation(relation, sessionHolder), relation)
+ .asInstanceOf[DataFrame]
+ }
}
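The MLHandler change introduces a watchdog ("reaper") thread that interrupts handler threads running past an env-configured timeout, and `wrapHandler` records per-thread start times and converts the resulting `InterruptedException` into an internal error. A self-contained sketch of that pattern, with names that are stand-ins for the real handler:

```scala
import java.util.concurrent.ConcurrentHashMap
import scala.jdk.CollectionConverters._

object WatchdogSketch {
  private val startTimes = new ConcurrentHashMap[Long, Long]()

  // Daemon thread that interrupts any registered thread exceeding the timeout.
  def startWatchdog(timeoutMillis: Long, checkIntervalMillis: Long = 60000L): Unit = {
    val t = new Thread(() => {
      while (true) {
        val now = System.currentTimeMillis()
        startTimes.forEach { (threadId, startTime) =>
          if (now - startTime > timeoutMillis) {
            Thread.getAllStackTraces.keySet().asScala
              .find(_.getId == threadId)
              .foreach(_.interrupt())
          }
        }
        Thread.sleep(checkIntervalMillis)
      }
    })
    t.setDaemon(true)
    t.start()
  }

  // Record the start time for the current thread while the body runs.
  def runTracked[T](body: => T): T = {
    val id = Thread.currentThread().getId
    startTimes.put(id, System.currentTimeMillis())
    try body finally startTimes.remove(id)
  }
}
```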
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLUtils.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLUtils.scala
index 0ab9105637291..b06ddaadc4da5 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLUtils.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ml/MLUtils.scala
@@ -40,7 +40,7 @@ import org.apache.spark.ml.tree.{DecisionTreeModel, TreeEnsembleModel}
import org.apache.spark.ml.util.{ConnectHelper, HasTrainingSummary, Identifiable, MLReader, MLWritable}
import org.apache.spark.sql.DataFrame
import org.apache.spark.sql.classic.Dataset
-import org.apache.spark.sql.connect.common.LiteralValueProtoConverter
+import org.apache.spark.sql.connect.common.{LiteralValueProtoConverter, ProtoSpecializedArray}
import org.apache.spark.sql.connect.planner.SparkConnectPlanner
import org.apache.spark.sql.connect.plugin.SparkConnectPluginRegistry
import org.apache.spark.sql.connect.service.SessionHolder
@@ -73,39 +73,19 @@ private[ml] object MLUtils {
.toMap
}
- private def parseInts(ints: proto.Ints): Array[Int] = {
- val size = ints.getValuesCount
- val values = Array.ofDim[Int](size)
- var i = 0
- while (i < size) {
- values(i) = ints.getValues(i)
- i += 1
- }
- values
- }
-
- private def parseDoubles(doubles: proto.Doubles): Array[Double] = {
- val size = doubles.getValuesCount
- val values = Array.ofDim[Double](size)
- var i = 0
- while (i < size) {
- values(i) = doubles.getValues(i)
- i += 1
- }
- values
- }
-
def deserializeVector(s: proto.Expression.Literal.Struct): Vector = {
assert(s.getElementsCount == 4)
s.getElements(0).getByte match {
case 0 =>
val size = s.getElements(1).getInteger
- val indices = parseInts(s.getElements(2).getSpecializedArray.getInts)
- val values = parseDoubles(s.getElements(3).getSpecializedArray.getDoubles)
+ val indices = ProtoSpecializedArray.toArray(s.getElements(2).getSpecializedArray.getInts)
+ val values =
+ ProtoSpecializedArray.toArray(s.getElements(3).getSpecializedArray.getDoubles)
Vectors.sparse(size, indices, values)
case 1 =>
- val values = parseDoubles(s.getElements(3).getSpecializedArray.getDoubles)
+ val values =
+ ProtoSpecializedArray.toArray(s.getElements(3).getSpecializedArray.getDoubles)
Vectors.dense(values)
case o => throw MlUnsupportedException(s"Unknown Vector type $o")
@@ -118,16 +98,19 @@ private[ml] object MLUtils {
case 0 =>
val numRows = s.getElements(1).getInteger
val numCols = s.getElements(2).getInteger
- val colPtrs = parseInts(s.getElements(3).getSpecializedArray.getInts)
- val rowIndices = parseInts(s.getElements(4).getSpecializedArray.getInts)
- val values = parseDoubles(s.getElements(5).getSpecializedArray.getDoubles)
+ val colPtrs = ProtoSpecializedArray.toArray(s.getElements(3).getSpecializedArray.getInts)
+ val rowIndices =
+ ProtoSpecializedArray.toArray(s.getElements(4).getSpecializedArray.getInts)
+ val values =
+ ProtoSpecializedArray.toArray(s.getElements(5).getSpecializedArray.getDoubles)
val isTransposed = s.getElements(6).getBoolean
new SparseMatrix(numRows, numCols, colPtrs, rowIndices, values, isTransposed)
case 1 =>
val numRows = s.getElements(1).getInteger
val numCols = s.getElements(2).getInteger
- val values = parseDoubles(s.getElements(5).getSpecializedArray.getDoubles)
+ val values =
+ ProtoSpecializedArray.toArray(s.getElements(5).getSpecializedArray.getDoubles)
val isTransposed = s.getElements(6).getBoolean
new DenseMatrix(numRows, numCols, values, isTransposed)
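The hand-rolled `parseInts`/`parseDoubles` loops are replaced by a shared `ProtoSpecializedArray.toArray` helper. A hedged sketch of what such a helper does, with small traits standing in for the generated proto accessors (the real helper lives in `org.apache.spark.sql.connect.common.ProtoSpecializedArray`):

```scala
trait IntsLike { def getValuesCount: Int; def getValues(i: Int): Int }
trait DoublesLike { def getValuesCount: Int; def getValues(i: Int): Double }

object SpecializedArraySketch {
  // Copy a repeated proto field into a primitive array without boxing.
  def toArray(ints: IntsLike): Array[Int] = {
    val out = Array.ofDim[Int](ints.getValuesCount)
    var i = 0
    while (i < out.length) { out(i) = ints.getValues(i); i += 1 }
    out
  }

  def toArray(doubles: DoublesLike): Array[Double] = {
    val out = Array.ofDim[Double](doubles.getValuesCount)
    var i = 0
    while (i < out.length) { out(i) = doubles.getValues(i); i += 1 }
    out
  }
}
```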
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/DataflowGraphRegistry.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/DataflowGraphRegistry.scala
index 4402dde04f3c8..e0c7beb43001d 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/DataflowGraphRegistry.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/DataflowGraphRegistry.scala
@@ -28,10 +28,7 @@ import org.apache.spark.sql.pipelines.graph.GraphRegistrationContext
* PipelinesHandler when CreateDataflowGraph is called, and the PipelinesHandler also supports
* attaching flows/datasets to a graph.
*/
-// TODO(SPARK-51727): Currently DataflowGraphRegistry is a singleton, but it should instead be
-// scoped to a single SparkSession for proper isolation between pipelines that are run on the
-// same cluster.
-object DataflowGraphRegistry {
+class DataflowGraphRegistry {
private val dataflowGraphs = new ConcurrentHashMap[String, GraphRegistrationContext]()
@@ -55,7 +52,7 @@ object DataflowGraphRegistry {
/** Retrieves the graph for a given id, and throws if the id could not be found. */
def getDataflowGraphOrThrow(dataflowGraphId: String): GraphRegistrationContext =
- DataflowGraphRegistry.getDataflowGraph(dataflowGraphId).getOrElse {
+ getDataflowGraph(dataflowGraphId).getOrElse {
throw new SparkException(
errorClass = "DATAFLOW_GRAPH_NOT_FOUND",
messageParameters = Map("graphId" -> dataflowGraphId),
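Turning `DataflowGraphRegistry` from a singleton into a class means each session holder owns its own registry, so graphs registered in one session are invisible to others. A minimal sketch of that per-session scoping, with `GraphContext` standing in for the real `GraphRegistrationContext`:

```scala
import java.util.UUID
import java.util.concurrent.ConcurrentHashMap

final case class GraphContext(defaultCatalog: String, defaultDatabase: String)

final class DataflowGraphRegistrySketch {
  private val graphs = new ConcurrentHashMap[String, GraphContext]()

  def createDataflowGraph(defaultCatalog: String, defaultDatabase: String): String = {
    val id = UUID.randomUUID().toString
    graphs.put(id, GraphContext(defaultCatalog, defaultDatabase))
    id
  }

  def getDataflowGraph(id: String): Option[GraphContext] = Option(graphs.get(id))

  def dropDataflowGraph(id: String): Unit = graphs.remove(id)
}

final class SessionHolderSketch {
  // One registry per session instead of a JVM-wide singleton.
  val dataflowGraphRegistry = new DataflowGraphRegistrySketch
}
```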
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/PipelinesHandler.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/PipelinesHandler.scala
index 92cb5bcac4ee0..b595ba2c501ed 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/PipelinesHandler.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/pipelines/PipelinesHandler.scala
@@ -26,14 +26,13 @@ import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.{ExecutePlanResponse, PipelineCommandResult, Relation}
import org.apache.spark.internal.Logging
import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.catalyst.TableIdentifier
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
-import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.connect.common.DataTypeProtoConverter
import org.apache.spark.sql.connect.service.SessionHolder
import org.apache.spark.sql.pipelines.Language.Python
-import org.apache.spark.sql.pipelines.QueryOriginType
import org.apache.spark.sql.pipelines.common.RunState.{CANCELED, FAILED}
-import org.apache.spark.sql.pipelines.graph.{FlowAnalysis, GraphIdentifierManager, IdentifierHelper, PipelineUpdateContextImpl, QueryContext, QueryOrigin, SqlGraphRegistrationContext, Table, TemporaryView, UnresolvedFlow}
+import org.apache.spark.sql.pipelines.graph.{AllTables, FlowAnalysis, GraphIdentifierManager, GraphRegistrationContext, IdentifierHelper, NoTables, PipelineUpdateContextImpl, QueryContext, QueryOrigin, QueryOriginType, SomeTables, SqlGraphRegistrationContext, Table, TableFilter, TemporaryView, UnresolvedFlow}
import org.apache.spark.sql.pipelines.logging.{PipelineEvent, RunProgress}
import org.apache.spark.sql.types.StructType
@@ -67,7 +66,7 @@ private[connect] object PipelinesHandler extends Logging {
cmd.getCommandTypeCase match {
case proto.PipelineCommand.CommandTypeCase.CREATE_DATAFLOW_GRAPH =>
val createdGraphId =
- createDataflowGraph(cmd.getCreateDataflowGraph, sessionHolder.session)
+ createDataflowGraph(cmd.getCreateDataflowGraph, sessionHolder)
PipelineCommandResult
.newBuilder()
.setCreateDataflowGraphResult(
@@ -77,15 +76,16 @@ private[connect] object PipelinesHandler extends Logging {
.build()
case proto.PipelineCommand.CommandTypeCase.DROP_DATAFLOW_GRAPH =>
logInfo(s"Drop pipeline cmd received: $cmd")
- DataflowGraphRegistry.dropDataflowGraph(cmd.getDropDataflowGraph.getDataflowGraphId)
+ sessionHolder.dataflowGraphRegistry
+ .dropDataflowGraph(cmd.getDropDataflowGraph.getDataflowGraphId)
defaultResponse
case proto.PipelineCommand.CommandTypeCase.DEFINE_DATASET =>
logInfo(s"Define pipelines dataset cmd received: $cmd")
- defineDataset(cmd.getDefineDataset, sessionHolder.session)
+ defineDataset(cmd.getDefineDataset, sessionHolder)
defaultResponse
case proto.PipelineCommand.CommandTypeCase.DEFINE_FLOW =>
logInfo(s"Define pipelines flow cmd received: $cmd")
- defineFlow(cmd.getDefineFlow, transformRelationFunc, sessionHolder.session)
+ defineFlow(cmd.getDefineFlow, transformRelationFunc, sessionHolder)
defaultResponse
case proto.PipelineCommand.CommandTypeCase.START_RUN =>
logInfo(s"Start pipeline cmd received: $cmd")
@@ -93,7 +93,7 @@ private[connect] object PipelinesHandler extends Logging {
defaultResponse
case proto.PipelineCommand.CommandTypeCase.DEFINE_SQL_GRAPH_ELEMENTS =>
logInfo(s"Register sql datasets cmd received: $cmd")
- defineSqlGraphElements(cmd.getDefineSqlGraphElements, sessionHolder.session)
+ defineSqlGraphElements(cmd.getDefineSqlGraphElements, sessionHolder)
defaultResponse
case other => throw new UnsupportedOperationException(s"$other not supported")
}
@@ -101,24 +101,24 @@ private[connect] object PipelinesHandler extends Logging {
private def createDataflowGraph(
cmd: proto.PipelineCommand.CreateDataflowGraph,
- spark: SparkSession): String = {
+ sessionHolder: SessionHolder): String = {
val defaultCatalog = Option
.when(cmd.hasDefaultCatalog)(cmd.getDefaultCatalog)
.getOrElse {
logInfo(s"No default catalog was supplied. Falling back to the current catalog.")
- spark.catalog.currentCatalog()
+ sessionHolder.session.catalog.currentCatalog()
}
val defaultDatabase = Option
.when(cmd.hasDefaultDatabase)(cmd.getDefaultDatabase)
.getOrElse {
logInfo(s"No default database was supplied. Falling back to the current database.")
- spark.catalog.currentDatabase
+ sessionHolder.session.catalog.currentDatabase
}
val defaultSqlConf = cmd.getSqlConfMap.asScala.toMap
- DataflowGraphRegistry.createDataflowGraph(
+ sessionHolder.dataflowGraphRegistry.createDataflowGraph(
defaultCatalog = defaultCatalog,
defaultDatabase = defaultDatabase,
defaultSqlConf = defaultSqlConf)
@@ -126,24 +126,31 @@ private[connect] object PipelinesHandler extends Logging {
private def defineSqlGraphElements(
cmd: proto.PipelineCommand.DefineSqlGraphElements,
- session: SparkSession): Unit = {
+ sessionHolder: SessionHolder): Unit = {
val dataflowGraphId = cmd.getDataflowGraphId
- val graphElementRegistry = DataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
+ val graphElementRegistry =
+ sessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
val sqlGraphElementRegistrationContext = new SqlGraphRegistrationContext(graphElementRegistry)
- sqlGraphElementRegistrationContext.processSqlFile(cmd.getSqlText, cmd.getSqlFilePath, session)
+ sqlGraphElementRegistrationContext.processSqlFile(
+ cmd.getSqlText,
+ cmd.getSqlFilePath,
+ sessionHolder.session)
}
private def defineDataset(
dataset: proto.PipelineCommand.DefineDataset,
- sparkSession: SparkSession): Unit = {
+ sessionHolder: SessionHolder): Unit = {
val dataflowGraphId = dataset.getDataflowGraphId
- val graphElementRegistry = DataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
+ val graphElementRegistry =
+ sessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
dataset.getDatasetType match {
case proto.DatasetType.MATERIALIZED_VIEW | proto.DatasetType.TABLE =>
val tableIdentifier =
- GraphIdentifierManager.parseTableIdentifier(dataset.getDatasetName, sparkSession)
+ GraphIdentifierManager.parseTableIdentifier(
+ dataset.getDatasetName,
+ sessionHolder.session)
graphElementRegistry.registerTable(
Table(
identifier = tableIdentifier,
@@ -161,10 +168,12 @@ private[connect] object PipelinesHandler extends Logging {
language = Option(Python())),
format = Option.when(dataset.hasFormat)(dataset.getFormat),
normalizedPath = None,
- isStreamingTableOpt = None))
+ isStreamingTable = dataset.getDatasetType == proto.DatasetType.TABLE))
case proto.DatasetType.TEMPORARY_VIEW =>
val viewIdentifier =
- GraphIdentifierManager.parseTableIdentifier(dataset.getDatasetName, sparkSession)
+ GraphIdentifierManager.parseTableIdentifier(
+ dataset.getDatasetName,
+ sessionHolder.session)
graphElementRegistry.registerView(
TemporaryView(
@@ -183,14 +192,15 @@ private[connect] object PipelinesHandler extends Logging {
private def defineFlow(
flow: proto.PipelineCommand.DefineFlow,
transformRelationFunc: Relation => LogicalPlan,
- sparkSession: SparkSession): Unit = {
+ sessionHolder: SessionHolder): Unit = {
val dataflowGraphId = flow.getDataflowGraphId
- val graphElementRegistry = DataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
+ val graphElementRegistry =
+ sessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
val isImplicitFlow = flow.getFlowName == flow.getTargetDatasetName
val flowIdentifier = GraphIdentifierManager
- .parseTableIdentifier(name = flow.getFlowName, spark = sparkSession)
+ .parseTableIdentifier(name = flow.getFlowName, spark = sessionHolder.session)
// If the flow is not an implicit flow (i.e. one defined as part of dataset creation), then
// it must be a single-part identifier.
@@ -204,15 +214,14 @@ private[connect] object PipelinesHandler extends Logging {
new UnresolvedFlow(
identifier = flowIdentifier,
destinationIdentifier = GraphIdentifierManager
- .parseTableIdentifier(name = flow.getTargetDatasetName, spark = sparkSession),
+ .parseTableIdentifier(name = flow.getTargetDatasetName, spark = sessionHolder.session),
func =
- FlowAnalysis.createFlowFunctionFromLogicalPlan(transformRelationFunc(flow.getPlan)),
+ FlowAnalysis.createFlowFunctionFromLogicalPlan(transformRelationFunc(flow.getRelation)),
sqlConf = flow.getSqlConfMap.asScala.toMap,
- once = flow.getOnce,
+ once = false,
queryContext = QueryContext(
Option(graphElementRegistry.defaultCatalog),
Option(graphElementRegistry.defaultDatabase)),
- comment = None,
origin = QueryOrigin(
objectType = Option(QueryOriginType.Flow.toString),
objectName = Option(flowIdentifier.unquotedString),
@@ -224,9 +233,12 @@ private[connect] object PipelinesHandler extends Logging {
responseObserver: StreamObserver[ExecutePlanResponse],
sessionHolder: SessionHolder): Unit = {
val dataflowGraphId = cmd.getDataflowGraphId
- val graphElementRegistry = DataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
+ val graphElementRegistry =
+ sessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(dataflowGraphId)
+ val tableFiltersResult = createTableFilters(cmd, graphElementRegistry, sessionHolder)
+
// We will use this variable to store the run failure event if it occurs. This will be set
- // by the event callback that is executed when an event is added to the PipelineRunEventBuffer.
+ // by the event callback.
@volatile var runFailureEvent = Option.empty[PipelineEvent]
// Define a callback which will stream logs back to the SparkConnect client when an internal
// pipeline event is emitted during pipeline execution. We choose to pass a callback rather the
@@ -280,10 +292,17 @@ private[connect] object PipelinesHandler extends Logging {
.build())
}
}
- val pipelineUpdateContext =
- new PipelineUpdateContextImpl(graphElementRegistry.toDataflowGraph, eventCallback)
+ val pipelineUpdateContext = new PipelineUpdateContextImpl(
+ graphElementRegistry.toDataflowGraph,
+ eventCallback,
+ tableFiltersResult.refresh,
+ tableFiltersResult.fullRefresh)
sessionHolder.cachePipelineExecution(dataflowGraphId, pipelineUpdateContext)
- pipelineUpdateContext.pipelineExecution.runPipeline()
+ if (cmd.getDry) {
+ pipelineUpdateContext.pipelineExecution.dryRunPipeline()
+ } else {
+ pipelineUpdateContext.pipelineExecution.runPipeline()
+ }
// Rethrow any exceptions that caused the pipeline run to fail so that the exception is
// propagated back to the SC client / CLI.
@@ -291,4 +310,87 @@ private[connect] object PipelinesHandler extends Logging {
throw event.error.get
}
}
+
+ /**
+ * Creates the table filters for the full refresh and refresh operations based on the StartRun
+ * command provided by the user. Also validates the command parameters to ensure that they are
+ * consistent and do not conflict with each other.
+ *
+ * If `fullRefreshAll` is true, creates an `AllTables` filter for full refresh.
+ *
+ * If `fullRefreshTables` and `refreshTables` are both empty, creates an `AllTables` filter for
+ * refresh as the default behavior.
+ *
+ * If both are non-empty, verifies that they do not overlap and creates `SomeTables` filters for both.
+ *
+ * If one is non-empty and the other is empty, creates a `SomeTables` filter for the non-empty
+ * one and a `NoTables` filter for the empty one.
+ */
+ private def createTableFilters(
+ startRunCommand: proto.PipelineCommand.StartRun,
+ graphElementRegistry: GraphRegistrationContext,
+ sessionHolder: SessionHolder): TableFilters = {
+ // Convert table names to fully qualified TableIdentifier objects
+ def parseTableNames(tableNames: Seq[String]): Set[TableIdentifier] = {
+ tableNames.map { name =>
+ GraphIdentifierManager
+ .parseAndQualifyTableIdentifier(
+ rawTableIdentifier =
+ GraphIdentifierManager.parseTableIdentifier(name, sessionHolder.session),
+ currentCatalog = Some(graphElementRegistry.defaultCatalog),
+ currentDatabase = Some(graphElementRegistry.defaultDatabase))
+ .identifier
+ }.toSet
+ }
+
+ val fullRefreshTables = startRunCommand.getFullRefreshSelectionList.asScala.toSeq
+ val fullRefreshAll = startRunCommand.getFullRefreshAll
+ val refreshTables = startRunCommand.getRefreshSelectionList.asScala.toSeq
+
+ if (refreshTables.nonEmpty && fullRefreshAll) {
+ throw new IllegalArgumentException(
+ "Cannot specify a subset to refresh when full refresh all is set to true.")
+ }
+
+ if (fullRefreshTables.nonEmpty && fullRefreshAll) {
+ throw new IllegalArgumentException(
+ "Cannot specify a subset to full refresh when full refresh all is set to true.")
+ }
+ val refreshTableNames = parseTableNames(refreshTables)
+ val fullRefreshTableNames = parseTableNames(fullRefreshTables)
+
+ if (refreshTables.nonEmpty && fullRefreshTables.nonEmpty) {
+ // Check that the refresh and full-refresh subsets do not overlap
+ val intersection = refreshTableNames.intersect(fullRefreshTableNames)
+ if (intersection.nonEmpty) {
+ throw new IllegalArgumentException(
+ "Datasets specified for refresh and full refresh cannot overlap: " +
+ s"${intersection.mkString(", ")}")
+ }
+ }
+
+ if (fullRefreshAll) {
+ return TableFilters(fullRefresh = AllTables, refresh = NoTables)
+ }
+
+ (fullRefreshTables, refreshTables) match {
+ case (Nil, Nil) =>
+ // If both are empty, we default to refreshing all tables
+ TableFilters(fullRefresh = NoTables, refresh = AllTables)
+ case (_, Nil) =>
+ TableFilters(fullRefresh = SomeTables(fullRefreshTableNames), refresh = NoTables)
+ case (Nil, _) =>
+ TableFilters(fullRefresh = NoTables, refresh = SomeTables(refreshTableNames))
+ case (_, _) =>
+ // If both are specified, we create filters for both after validation
+ TableFilters(
+ fullRefresh = SomeTables(fullRefreshTableNames),
+ refresh = SomeTables(refreshTableNames))
+ }
+ }
+
+ /**
+ * A case class to hold the table filters for full refresh and refresh operations.
+ */
+ private case class TableFilters(fullRefresh: TableFilter, refresh: TableFilter)
}
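A self-contained sketch of the refresh/full-refresh filter resolution documented in `createTableFilters` above. The types below mirror the pipeline graph API in shape only (`*Sketch` names are stand-ins), and table names are plain strings rather than qualified identifiers:

```scala
sealed trait TableFilterSketch
case object AllTablesSketch extends TableFilterSketch
case object NoTablesSketch extends TableFilterSketch
final case class SomeTablesSketch(tables: Set[String]) extends TableFilterSketch

final case class TableFiltersSketch(fullRefresh: TableFilterSketch, refresh: TableFilterSketch)

object TableFilterResolution {
  def resolve(
      fullRefreshAll: Boolean,
      fullRefreshTables: Set[String],
      refreshTables: Set[String]): TableFiltersSketch = {
    require(!(fullRefreshAll && refreshTables.nonEmpty),
      "Cannot specify a subset to refresh when full refresh all is set to true.")
    require(!(fullRefreshAll && fullRefreshTables.nonEmpty),
      "Cannot specify a subset to full refresh when full refresh all is set to true.")
    val overlap = fullRefreshTables.intersect(refreshTables)
    require(overlap.isEmpty,
      s"Datasets specified for refresh and full refresh cannot overlap: ${overlap.mkString(", ")}")

    if (fullRefreshAll) {
      TableFiltersSketch(fullRefresh = AllTablesSketch, refresh = NoTablesSketch)
    } else (fullRefreshTables.isEmpty, refreshTables.isEmpty) match {
      case (true, true)   => TableFiltersSketch(NoTablesSketch, AllTablesSketch)
      case (false, true)  => TableFiltersSketch(SomeTablesSketch(fullRefreshTables), NoTablesSketch)
      case (true, false)  => TableFiltersSketch(NoTablesSketch, SomeTablesSketch(refreshTables))
      case (false, false) =>
        TableFiltersSketch(SomeTablesSketch(fullRefreshTables), SomeTablesSketch(refreshTables))
    }
  }
}
```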
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverter.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverter.scala
index 50f413399befd..e1d30240f867e 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverter.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverter.scala
@@ -97,21 +97,35 @@ object LiteralExpressionProtoConverter {
case proto.Expression.Literal.LiteralTypeCase.DAY_TIME_INTERVAL =>
expressions.Literal(lit.getDayTimeInterval, DayTimeIntervalType())
+ case proto.Expression.Literal.LiteralTypeCase.TIME =>
+ var precision = TimeType.DEFAULT_PRECISION
+ if (lit.getTime.hasPrecision) {
+ precision = lit.getTime.getPrecision
+ }
+ expressions.Literal(lit.getTime.getNano, TimeType(precision))
+
case proto.Expression.Literal.LiteralTypeCase.ARRAY =>
- expressions.Literal.create(
- LiteralValueProtoConverter.toCatalystArray(lit.getArray),
- ArrayType(DataTypeProtoConverter.toCatalystType(lit.getArray.getElementType)))
+ val arrayData = LiteralValueProtoConverter.toCatalystArray(lit.getArray)
+ val dataType = DataTypeProtoConverter.toCatalystType(
+ proto.DataType.newBuilder
+ .setArray(LiteralValueProtoConverter.getProtoArrayType(lit.getArray))
+ .build())
+ expressions.Literal.create(arrayData, dataType)
case proto.Expression.Literal.LiteralTypeCase.MAP =>
- expressions.Literal.create(
- LiteralValueProtoConverter.toCatalystMap(lit.getMap),
- MapType(
- DataTypeProtoConverter.toCatalystType(lit.getMap.getKeyType),
- DataTypeProtoConverter.toCatalystType(lit.getMap.getValueType)))
+ val mapData = LiteralValueProtoConverter.toCatalystMap(lit.getMap)
+ val dataType = DataTypeProtoConverter.toCatalystType(
+ proto.DataType.newBuilder
+ .setMap(LiteralValueProtoConverter.getProtoMapType(lit.getMap))
+ .build())
+ expressions.Literal.create(mapData, dataType)
case proto.Expression.Literal.LiteralTypeCase.STRUCT =>
- val dataType = DataTypeProtoConverter.toCatalystType(lit.getStruct.getStructType)
val structData = LiteralValueProtoConverter.toCatalystStruct(lit.getStruct)
+ val dataType = DataTypeProtoConverter.toCatalystType(
+ proto.DataType.newBuilder
+ .setStruct(LiteralValueProtoConverter.getProtoStructType(lit.getStruct))
+ .build())
val convert = CatalystTypeConverters.createToCatalystConverter(dataType)
expressions.Literal(convert(structData), dataType)
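With the data type now decoded from the literal proto itself, the converter builds the Catalyst literal from the value plus that explicit type. Illustrative only, using the general-purpose `Literal.create(value, dataType)` mechanism rather than the proto plumbing:

```scala
import org.apache.spark.sql.catalyst.expressions.Literal
import org.apache.spark.sql.types.{ArrayType, IntegerType, MapType, StringType}

object LiteralTypeSketch {
  def main(args: Array[String]): Unit = {
    // Once the type is known, the value is converted to Catalyst form under that type.
    val arrayLit = Literal.create(Array(1, 2, 3), ArrayType(IntegerType))
    val mapLit = Literal.create(Map("a" -> 1, "b" -> 2), MapType(StringType, IntegerType))
    println(arrayLit.dataType)
    println(mapLit.dataType)
  }
}
```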
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectPlanner.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectPlanner.scala
index bcd643a30253f..c0b1fd01616a4 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectPlanner.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectPlanner.scala
@@ -17,8 +17,7 @@
package org.apache.spark.sql.connect.planner
-import java.util.Properties
-import java.util.UUID
+import java.util.{HashMap, Properties, UUID}
import scala.collection.mutable
import scala.jdk.CollectionConverters._
@@ -26,11 +25,10 @@ import scala.util.Try
import scala.util.control.NonFatal
import com.google.common.base.Throwables
-import com.google.common.collect.{Lists, Maps}
+import com.google.common.collect.Lists
import com.google.protobuf.{Any => ProtoAny, ByteString}
import io.grpc.{Context, Status, StatusRuntimeException}
import io.grpc.stub.StreamObserver
-import org.apache.commons.lang3.exception.ExceptionUtils
import org.apache.spark.{SparkClassNotFoundException, SparkEnv, SparkException, TaskContext}
import org.apache.spark.annotation.{DeveloperApi, Since}
@@ -41,7 +39,7 @@ import org.apache.spark.connect.proto.ExecutePlanResponse.SqlCommandResult
import org.apache.spark.connect.proto.Parse.ParseFormat
import org.apache.spark.connect.proto.StreamingQueryManagerCommandResult.StreamingQueryInstance
import org.apache.spark.connect.proto.WriteStreamOperationStart.TriggerCase
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.LogKeys.{DATAFRAME_ID, SESSION_ID}
import org.apache.spark.resource.{ExecutorResourceRequest, ResourceProfile, TaskResourceProfile, TaskResourceRequest}
import org.apache.spark.sql.{Column, Encoders, ForeachWriter, Observation, Row}
@@ -59,7 +57,7 @@ import org.apache.spark.sql.catalyst.streaming.InternalOutputModes
import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin, TreePattern}
import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.catalyst.util.{CaseInsensitiveMap, CharVarcharUtils}
-import org.apache.spark.sql.classic.{Catalog, Dataset, MergeIntoWriter, RelationalGroupedDataset, SparkSession, TypedAggUtils, UserDefinedFunctionUtils}
+import org.apache.spark.sql.classic.{Catalog, DataFrameWriter, Dataset, MergeIntoWriter, RelationalGroupedDataset, SparkSession, TypedAggUtils, UserDefinedFunctionUtils}
import org.apache.spark.sql.classic.ClassicConversions._
import org.apache.spark.sql.connect.client.arrow.ArrowSerializer
import org.apache.spark.sql.connect.common.{DataTypeProtoConverter, ForeachWriterPacket, LiteralValueProtoConverter, StorageLevelProtoConverter, StreamingListenerPacket, UdfPacket}
@@ -79,8 +77,8 @@ import org.apache.spark.sql.execution.datasources.v2.python.UserDefinedPythonDat
import org.apache.spark.sql.execution.python.{UserDefinedPythonFunction, UserDefinedPythonTableFunction}
import org.apache.spark.sql.execution.python.streaming.PythonForeachWriter
import org.apache.spark.sql.execution.stat.StatFunctions
-import org.apache.spark.sql.execution.streaming.GroupStateImpl.groupStateTimeoutFromString
-import org.apache.spark.sql.execution.streaming.StreamingQueryWrapper
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl.groupStateTimeoutFromString
+import org.apache.spark.sql.execution.streaming.runtime.StreamingQueryWrapper
import org.apache.spark.sql.expressions.{Aggregator, ReduceAggregator, SparkUserDefinedFunction, UserDefinedAggregator, UserDefinedFunction}
import org.apache.spark.sql.streaming.{GroupStateTimeout, OutputMode, StatefulProcessor, StatefulProcessorWithInitialState, StreamingQuery, StreamingQueryListener, StreamingQueryProgress, Trigger}
import org.apache.spark.sql.types._
@@ -1191,7 +1189,7 @@ class SparkConnectPlanner(
SimplePythonFunction(
command = fun.getCommand.toByteArray.toImmutableArraySeq,
// Empty environment variables
- envVars = Maps.newHashMap(),
+ envVars = new HashMap[String, String](),
pythonIncludes = sessionHolder.artifactManager.getPythonIncludes.asJava,
pythonExec = pythonExec,
pythonVer = fun.getPythonVer,
@@ -1205,7 +1203,7 @@ class SparkConnectPlanner(
SimplePythonFunction(
command = ds.getCommand.toByteArray.toImmutableArraySeq,
// Empty environment variables
- envVars = Maps.newHashMap(),
+ envVars = new HashMap[String, String](),
pythonIncludes = sessionHolder.artifactManager.getPythonIncludes.asJava,
pythonExec = pythonExec,
pythonVer = ds.getPythonVer,
@@ -1443,9 +1441,8 @@ class SparkConnectPlanner(
}
if (rel.hasData) {
- val (rows, structType) = ArrowConverters.fromBatchWithSchemaIterator(
- Iterator(rel.getData.toByteArray),
- TaskContext.get())
+ val (rows, structType) =
+ ArrowConverters.fromIPCStream(rel.getData.toByteArray, TaskContext.get())
if (structType == null) {
throw InvalidInputErrors.inputDataForLocalRelationNoSchema()
}
@@ -2034,7 +2031,7 @@ class SparkConnectPlanner(
SimplePythonFunction(
command = fun.getCommand.toByteArray.toImmutableArraySeq,
// Empty environment variables
- envVars = Maps.newHashMap(),
+ envVars = new HashMap[String, String](),
pythonExec = pythonExec,
// Merge the user specified includes with the includes managed by the artifact manager.
pythonIncludes = (fun.getAdditionalIncludesList.asScala.toSeq ++
@@ -2646,9 +2643,29 @@ class SparkConnectPlanner(
process(command, new MockObserver())
}
+ def transformCommand(command: proto.Command): Option[QueryPlanningTracker => LogicalPlan] = {
+ command.getCommandTypeCase match {
+ case proto.Command.CommandTypeCase.WRITE_OPERATION =>
+ Some(transformWriteOperation(command.getWriteOperation))
+ case proto.Command.CommandTypeCase.WRITE_OPERATION_V2 =>
+ Some(transformWriteOperationV2(command.getWriteOperationV2))
+ case proto.Command.CommandTypeCase.MERGE_INTO_TABLE_COMMAND =>
+ Some(transformMergeIntoTableCommand(command.getMergeIntoTableCommand))
+ case proto.Command.CommandTypeCase.CREATE_DATAFRAME_VIEW =>
+ Some(_ => transformCreateViewCommand(command.getCreateDataframeView))
+ case _ =>
+ None
+ }
+ }
+
def process(
command: proto.Command,
responseObserver: StreamObserver[ExecutePlanResponse]): Unit = {
+ val transformerOpt = transformCommand(command)
+ if (transformerOpt.isDefined) {
+ transformAndRunCommand(transformerOpt.get)
+ return
+ }
command.getCommandTypeCase match {
case proto.Command.CommandTypeCase.REGISTER_FUNCTION =>
handleRegisterUserDefinedFunction(command.getRegisterFunction)
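The new `transformCommand` returns an `Option[QueryPlanningTracker => LogicalPlan]`, i.e. a deferred translation: the caller decides when, and with which tracker, to materialize and execute the plan. A simplified sketch of that pattern with stand-in types:

```scala
final case class TrackerSketch(name: String)
final case class PlanSketch(description: String)

object DeferredCommandSketch {
  // Commands with a pure translation return a tracker-to-plan function;
  // anything else returns None and keeps the legacy handling path.
  def transformCommand(command: String): Option[TrackerSketch => PlanSketch] =
    command match {
      case "write" => Some(tracker => PlanSketch(s"write plan traced by ${tracker.name}"))
      case "view"  => Some(_ => PlanSketch("create view plan"))
      case _       => None
    }

  def main(args: Array[String]): Unit = {
    transformCommand("write").foreach { translate =>
      val plan = translate(TrackerSketch("tracker-1"))
      println(plan.description)
    }
  }
}
```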
@@ -2656,12 +2673,6 @@ class SparkConnectPlanner(
handleRegisterUserDefinedTableFunction(command.getRegisterTableFunction)
case proto.Command.CommandTypeCase.REGISTER_DATA_SOURCE =>
handleRegisterUserDefinedDataSource(command.getRegisterDataSource)
- case proto.Command.CommandTypeCase.WRITE_OPERATION =>
- handleWriteOperation(command.getWriteOperation)
- case proto.Command.CommandTypeCase.CREATE_DATAFRAME_VIEW =>
- handleCreateViewCommand(command.getCreateDataframeView)
- case proto.Command.CommandTypeCase.WRITE_OPERATION_V2 =>
- handleWriteOperationV2(command.getWriteOperationV2)
case proto.Command.CommandTypeCase.EXTENSION =>
handleCommandPlugin(command.getExtension)
case proto.Command.CommandTypeCase.SQL_COMMAND =>
@@ -2689,8 +2700,6 @@ class SparkConnectPlanner(
handleCheckpointCommand(command.getCheckpointCommand, responseObserver)
case proto.Command.CommandTypeCase.REMOVE_CACHED_REMOTE_RELATION_COMMAND =>
handleRemoveCachedRemoteRelationCommand(command.getRemoveCachedRemoteRelationCommand)
- case proto.Command.CommandTypeCase.MERGE_INTO_TABLE_COMMAND =>
- handleMergeIntoTableCommand(command.getMergeIntoTableCommand)
case proto.Command.CommandTypeCase.ML_COMMAND =>
handleMlCommand(command.getMlCommand, responseObserver)
case proto.Command.CommandTypeCase.PIPELINE_COMMAND =>
@@ -3050,7 +3059,8 @@ class SparkConnectPlanner(
executeHolder.eventsManager.postFinished()
}
- private def handleCreateViewCommand(createView: proto.CreateDataFrameViewCommand): Unit = {
+ private def transformCreateViewCommand(
+ createView: proto.CreateDataFrameViewCommand): LogicalPlan = {
val viewType = if (createView.getIsGlobal) GlobalTempView else LocalTempView
val tableIdentifier =
@@ -3061,7 +3071,7 @@ class SparkConnectPlanner(
throw QueryCompilationErrors.invalidViewNameError(createView.getName)
}
- val plan = CreateViewCommand(
+ CreateViewCommand(
name = tableIdentifier,
userSpecifiedColumns = Nil,
comment = None,
@@ -3072,14 +3082,10 @@ class SparkConnectPlanner(
allowExisting = false,
replace = createView.getReplace,
viewType = viewType)
-
- val tracker = executeHolder.eventsManager.createQueryPlanningTracker()
- Dataset.ofRows(session, plan, tracker).queryExecution.commandExecuted
- executeHolder.eventsManager.postFinished()
}
/**
- * Transforms the write operation and executes it.
+ * Transforms the write operation.
*
* The input write operation contains a reference to the input plan and transforms it to the
* corresponding logical plan. Afterwards, creates the DataFrameWriter and translates the
@@ -3087,14 +3093,14 @@ class SparkConnectPlanner(
*
* @param writeOperation
*/
- private def handleWriteOperation(writeOperation: proto.WriteOperation): Unit = {
+ private def transformWriteOperation(writeOperation: proto.WriteOperation)(
+ tracker: QueryPlanningTracker): LogicalPlan = {
// Transform the input plan into the logical plan.
val plan = transformRelation(writeOperation.getInput)
// And create a Dataset from the plan.
- val tracker = executeHolder.eventsManager.createQueryPlanningTracker()
val dataset = Dataset.ofRows(session, plan, tracker)
- val w = dataset.write
+ val w = dataset.write.asInstanceOf[DataFrameWriter[_]]
if (writeOperation.getMode != proto.WriteOperation.SaveMode.SAVE_MODE_UNSPECIFIED) {
w.mode(SaveModeConverter.toSaveMode(writeOperation.getMode))
}
@@ -3129,25 +3135,32 @@ class SparkConnectPlanner(
}
writeOperation.getSaveTypeCase match {
- case proto.WriteOperation.SaveTypeCase.SAVETYPE_NOT_SET => w.save()
- case proto.WriteOperation.SaveTypeCase.PATH => w.save(writeOperation.getPath)
+ case proto.WriteOperation.SaveTypeCase.SAVETYPE_NOT_SET => w.saveCommand(None)
+ case proto.WriteOperation.SaveTypeCase.PATH =>
+ w.saveCommand(Some(writeOperation.getPath))
case proto.WriteOperation.SaveTypeCase.TABLE =>
val tableName = writeOperation.getTable.getTableName
writeOperation.getTable.getSaveMethod match {
case proto.WriteOperation.SaveTable.TableSaveMethod.TABLE_SAVE_METHOD_SAVE_AS_TABLE =>
- w.saveAsTable(tableName)
+ w.saveAsTableCommand(tableName)
case proto.WriteOperation.SaveTable.TableSaveMethod.TABLE_SAVE_METHOD_INSERT_INTO =>
- w.insertInto(tableName)
+ w.insertIntoCommand(tableName)
case other => throw InvalidInputErrors.invalidEnum(other)
}
case other =>
throw InvalidInputErrors.invalidOneOfField(other, writeOperation.getDescriptorForType)
}
+ }
+
+ private def transformAndRunCommand(transformer: QueryPlanningTracker => LogicalPlan): Unit = {
+ val tracker = executeHolder.eventsManager.createQueryPlanningTracker()
+ val qe = new QueryExecution(session, transformer(tracker), tracker)
+ qe.assertCommandExecuted()
executeHolder.eventsManager.postFinished()
}
/**
- * Transforms the write operation and executes it.
+ * Transforms the write operation.
*
* The input write operation contains a reference to the input plan and transforms it to the
* corresponding logical plan. Afterwards, creates the DataFrameWriter and translates the
@@ -3155,11 +3168,11 @@ class SparkConnectPlanner(
*
* @param writeOperation
*/
- private def handleWriteOperationV2(writeOperation: proto.WriteOperationV2): Unit = {
+ private def transformWriteOperationV2(writeOperation: proto.WriteOperationV2)(
+ tracker: QueryPlanningTracker): LogicalPlan = {
// Transform the input plan into the logical plan.
val plan = transformRelation(writeOperation.getInput)
// And create a Dataset from the plan.
- val tracker = executeHolder.eventsManager.createQueryPlanningTracker()
val dataset = Dataset.ofRows(session, plan, tracker)
val w = dataset.writeTo(table = writeOperation.getTableName)
@@ -3190,32 +3203,28 @@ class SparkConnectPlanner(
writeOperation.getMode match {
case proto.WriteOperationV2.Mode.MODE_CREATE =>
if (writeOperation.hasProvider) {
- w.using(writeOperation.getProvider).create()
- } else {
- w.create()
+ w.using(writeOperation.getProvider)
}
+ w.createCommand()
case proto.WriteOperationV2.Mode.MODE_OVERWRITE =>
- w.overwrite(Column(transformExpression(writeOperation.getOverwriteCondition)))
+ w.overwriteCommand(Column(transformExpression(writeOperation.getOverwriteCondition)))
case proto.WriteOperationV2.Mode.MODE_OVERWRITE_PARTITIONS =>
- w.overwritePartitions()
+ w.overwritePartitionsCommand()
case proto.WriteOperationV2.Mode.MODE_APPEND =>
- w.append()
+ w.appendCommand()
case proto.WriteOperationV2.Mode.MODE_REPLACE =>
if (writeOperation.hasProvider) {
- w.using(writeOperation.getProvider).replace()
- } else {
- w.replace()
+ w.using(writeOperation.getProvider)
}
+ w.replaceCommand(orCreate = false)
case proto.WriteOperationV2.Mode.MODE_CREATE_OR_REPLACE =>
if (writeOperation.hasProvider) {
- w.using(writeOperation.getProvider).createOrReplace()
- } else {
- w.createOrReplace()
+ w.using(writeOperation.getProvider)
}
+ w.replaceCommand(orCreate = true)
case other =>
throw InvalidInputErrors.invalidEnum(other)
}
- executeHolder.eventsManager.postFinished()
}
private def handleWriteStreamOperationStart(
@@ -3472,7 +3481,7 @@ class SparkConnectPlanner(
.setExceptionMessage(e.toString())
.setErrorClass(e.getCondition)
- val stackTrace = Option(ExceptionUtils.getStackTrace(e))
+ val stackTrace = Option(Utils.stackTraceToString(e))
stackTrace.foreach { s =>
exception_builder.setStackTrace(s)
}
@@ -3745,7 +3754,8 @@ class SparkConnectPlanner(
executeHolder.eventsManager.postFinished()
}
- private def handleMergeIntoTableCommand(cmd: proto.MergeIntoTableCommand): Unit = {
+ private def transformMergeIntoTableCommand(cmd: proto.MergeIntoTableCommand)(
+ tracker: QueryPlanningTracker): LogicalPlan = {
def transformActions(actions: java.util.List[proto.Expression]): Seq[MergeAction] =
actions.asScala.map(transformExpression).map(_.asInstanceOf[MergeAction]).toSeq
@@ -3753,7 +3763,7 @@ class SparkConnectPlanner(
val notMatchedActions = transformActions(cmd.getNotMatchedActionsList)
val notMatchedBySourceActions = transformActions(cmd.getNotMatchedBySourceActionsList)
- val sourceDs = Dataset.ofRows(session, transformRelation(cmd.getSourceTablePlan))
+ val sourceDs = Dataset.ofRows(session, transformRelation(cmd.getSourceTablePlan), tracker)
val mergeInto = sourceDs
.mergeInto(cmd.getTargetTableName, Column(transformExpression(cmd.getMergeCondition)))
.asInstanceOf[MergeIntoWriter[Row]]
@@ -3763,8 +3773,7 @@ class SparkConnectPlanner(
if (cmd.getWithSchemaEvolution) {
mergeInto.withSchemaEvolution()
}
- mergeInto.merge()
- executeHolder.eventsManager.postFinished()
+ mergeInto.mergeCommand()
}
private val emptyLocalRelation = LocalRelation(
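The planner refactor above folds the write, write-v2, merge-into, and create-view handlers into a single dispatch: commands that reduce to a logical plan are converted by `transformCommand` into a `QueryPlanningTracker => LogicalPlan` function and run through `transformAndRunCommand`, while every other command keeps its dedicated handler. A minimal standalone sketch of that shape, using simplified placeholder types rather than the real planner classes:

```scala
// Sketch only: Command, Tracker and Plan are placeholders, not Spark Connect types.
object CommandDispatchSketch {
  sealed trait Command
  case class Write(path: String) extends Command
  case class Register(name: String) extends Command

  class Tracker
  case class Plan(description: String)

  // Commands that reduce to a logical plan return a tracker-parameterized transformer.
  def transformCommand(cmd: Command): Option[Tracker => Plan] = cmd match {
    case Write(path) => Some(_ => Plan(s"WriteTo($path)"))
    case _           => None
  }

  // The shared execution path owns tracker creation and execution bookkeeping;
  // everything else falls through to a bespoke handler.
  def process(cmd: Command): Unit = {
    transformCommand(cmd) match {
      case Some(transformer) =>
        val tracker = new Tracker
        val plan = transformer(tracker)
        println(s"executing ${plan.description}")
      case None =>
        println(s"handled by a dedicated handler: $cmd")
    }
  }

  def main(args: Array[String]): Unit = {
    process(Write("/tmp/out"))
    process(Register("my_udf"))
  }
}
```

Returning a tracker-parameterized function lets the single `transformAndRunCommand` path own tracker creation, `assertCommandExecuted()`, and the `postFinished()` event, instead of repeating that bookkeeping in each handler.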
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectStreamingQueryListenerHandler.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectStreamingQueryListenerHandler.scala
index 70f18a1a9c1a0..04312a35a3b4b 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectStreamingQueryListenerHandler.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/SparkConnectStreamingQueryListenerHandler.scala
@@ -24,7 +24,7 @@ import io.grpc.stub.StreamObserver
import org.apache.spark.connect.proto.ExecutePlanResponse
import org.apache.spark.connect.proto.StreamingQueryListenerBusCommand
import org.apache.spark.connect.proto.StreamingQueryListenerEventsResult
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.connect.service.ExecuteHolder
/**
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingForeachBatchHelper.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingForeachBatchHelper.scala
index 5a44607a4c7d9..a4da5ea998386 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingForeachBatchHelper.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingForeachBatchHelper.scala
@@ -26,7 +26,7 @@ import scala.util.control.NonFatal
import org.apache.spark.SparkException
import org.apache.spark.api.python.{PythonException, PythonWorkerUtils, SimplePythonFunction, SpecialLengths, StreamingPythonRunner}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{DATAFRAME_ID, PYTHON_EXEC, QUERY_ID, RUN_ID_STRING, SESSION_ID, USER_ID}
import org.apache.spark.sql.{DataFrame, Dataset}
import org.apache.spark.sql.catalyst.encoders.{AgnosticEncoder, AgnosticEncoders}
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingQueryListenerHelper.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingQueryListenerHelper.scala
index 42c090d43f065..f994ada920ec2 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingQueryListenerHelper.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/planner/StreamingQueryListenerHelper.scala
@@ -21,7 +21,7 @@ import java.io.EOFException
import org.apache.spark.SparkException
import org.apache.spark.api.python.{PythonException, PythonWorkerUtils, SimplePythonFunction, SpecialLengths, StreamingPythonRunner}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.FUNCTION_NAME
import org.apache.spark.sql.connect.config.Connect
import org.apache.spark.sql.connect.service.{SessionHolder, SparkConnectService}
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/LoggingInterceptor.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/LoggingInterceptor.scala
index a071579692fb1..695034954e981 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/LoggingInterceptor.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/LoggingInterceptor.scala
@@ -28,7 +28,7 @@ import io.grpc.ServerCall
import io.grpc.ServerCallHandler
import io.grpc.ServerInterceptor
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{DESCRIPTION, MESSAGE}
/**
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SessionHolder.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SessionHolder.scala
index ada322fd859c5..be59439daefbb 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SessionHolder.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SessionHolder.scala
@@ -31,13 +31,14 @@ import com.google.common.cache.{Cache, CacheBuilder}
import org.apache.spark.{SparkEnv, SparkException, SparkSQLException}
import org.apache.spark.api.python.PythonFunction.PythonAccumulator
import org.apache.spark.connect.proto
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.DataFrame
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.connect.common.InvalidPlanInput
import org.apache.spark.sql.connect.config.Connect
import org.apache.spark.sql.connect.ml.MLCache
+import org.apache.spark.sql.connect.pipelines.DataflowGraphRegistry
import org.apache.spark.sql.connect.planner.PythonStreamingQueryListener
import org.apache.spark.sql.connect.planner.StreamingForeachBatchHelper
import org.apache.spark.sql.connect.service.SessionHolder.{ERROR_CACHE_SIZE, ERROR_CACHE_TIMEOUT_SEC}
@@ -125,6 +126,9 @@ case class SessionHolder(userId: String, sessionId: String, session: SparkSessio
private lazy val pipelineExecutions =
new ConcurrentHashMap[String, PipelineUpdateContext]()
+ // Registry for dataflow graphs specific to this session
+ private[connect] lazy val dataflowGraphRegistry = new DataflowGraphRegistry()
+
// Handles Python process clean up for streaming queries. Initialized on first use in a query.
private[connect] lazy val streamingForeachBatchRunnerCleanerCache =
new StreamingForeachBatchHelper.CleanerCache(this)
@@ -320,6 +324,9 @@ case class SessionHolder(userId: String, sessionId: String, session: SparkSessio
// Stops all pipeline execution and clears the pipeline execution cache
removeAllPipelineExecutions()
+ // Clean up dataflow graphs
+ dataflowGraphRegistry.dropAllDataflowGraphs()
+
// if there is a server side listener, clean up related resources
if (streamingServersideListenerHolder.isServerSideListenerRegistered) {
streamingServersideListenerHolder.cleanUp()
@@ -514,6 +521,11 @@ case class SessionHolder(userId: String, sessionId: String, session: SparkSessio
// We only cache plans that have a plan ID.
val hasPlanId = rel.hasCommon && rel.getCommon.hasPlanId
+ // Always cache a `Read.DataSource` to avoid re-analyzing the same `DataSource` twice.
+ lazy val alwaysCacheDataSourceReadsEnabled = Option(session)
+ .forall(_.conf.get(Connect.CONNECT_ALWAYS_CACHE_DATA_SOURCE_READS_ENABLED, true))
+ lazy val isDataSourceRead = rel.hasRead && rel.getRead.hasDataSource
+
def getPlanCache(rel: proto.Relation): Option[LogicalPlan] =
planCache match {
case Some(cache) if planCacheEnabled && hasPlanId =>
@@ -535,7 +547,7 @@ case class SessionHolder(userId: String, sessionId: String, session: SparkSessio
getPlanCache(rel)
.getOrElse({
val plan = transform(rel)
- if (cachePlan) {
+ if (cachePlan || (alwaysCacheDataSourceReadsEnabled && isDataSourceRead)) {
putPlanCache(rel, plan)
}
plan
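The `SessionHolder` change above extends the plan cache so that `Read.DataSource` relations are cached even when the caller did not request caching, guarded by a config flag, to avoid re-analyzing the same data source twice. A small sketch of that decision path, with placeholder types standing in for the proto relation and logical plan:

```scala
// Sketch only: placeholder types and a mutable Map instead of the real Guava cache.
object PlanCacheSketch {
  case class Relation(planId: Option[Long], isDataSourceRead: Boolean)
  case class Plan(treeString: String)

  val cache = scala.collection.mutable.Map.empty[Long, Plan]
  val alwaysCacheDataSourceReads = true // stands in for the new config flag

  def usePlanCache(rel: Relation, cachePlan: Boolean)(transform: Relation => Plan): Plan = {
    val cached = rel.planId.flatMap(cache.get)
    cached.getOrElse {
      val plan = transform(rel)
      // Cache when explicitly requested, or when the relation is a data source
      // read and the always-cache knob is enabled, so it is analyzed only once.
      if (cachePlan || (alwaysCacheDataSourceReads && rel.isDataSourceRead)) {
        rel.planId.foreach(id => cache.update(id, plan))
      }
      plan
    }
  }

  def main(args: Array[String]): Unit = {
    val rel = Relation(planId = Some(42L), isDataSourceRead = true)
    usePlanCache(rel, cachePlan = false)(_ => Plan("analyzed DataSource read")) // analyzes once
    usePlanCache(rel, cachePlan = false)(_ => sys.error("should hit the cache")) // served from cache
  }
}
```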
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectAddArtifactsHandler.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectAddArtifactsHandler.scala
index 3ba79402e99ef..becd7d855133d 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectAddArtifactsHandler.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectAddArtifactsHandler.scala
@@ -26,6 +26,7 @@ import scala.util.control.NonFatal
import com.google.common.io.CountingOutputStream
import io.grpc.stub.StreamObserver
+import org.apache.spark.SparkRuntimeException
import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.{AddArtifactsRequest, AddArtifactsResponse}
import org.apache.spark.connect.proto.AddArtifactsResponse.ArtifactSummary
@@ -112,19 +113,32 @@ class SparkConnectAddArtifactsHandler(val responseObserver: StreamObserver[AddAr
* @return
*/
protected def flushStagedArtifacts(): Seq[ArtifactSummary] = {
+ val failedArtifactExceptions = mutable.ListBuffer[SparkRuntimeException]()
+
// Non-lazy transformation when using Buffer.
- stagedArtifacts.map { artifact =>
- // We do not store artifacts that fail the CRC. The failure is reported in the artifact
- // summary and it is up to the client to decide whether to retry sending the artifact.
- if (artifact.getCrcStatus.contains(true)) {
- if (artifact.path.startsWith(ArtifactManager.forwardToFSPrefix + File.separator)) {
- holder.artifactManager.uploadArtifactToFs(artifact.path, artifact.stagedPath)
- } else {
- addStagedArtifactToArtifactManager(artifact)
+ val summaries = stagedArtifacts.map { artifact =>
+ try {
+ // We do not store artifacts that fail the CRC. The failure is reported in the artifact
+ // summary and it is up to the client to decide whether to retry sending the artifact.
+ if (artifact.getCrcStatus.contains(true)) {
+ if (artifact.path.startsWith(ArtifactManager.forwardToFSPrefix + File.separator)) {
+ holder.artifactManager.uploadArtifactToFs(artifact.path, artifact.stagedPath)
+ } else {
+ addStagedArtifactToArtifactManager(artifact)
+ }
}
+ } catch {
+ case e: SparkRuntimeException if e.getCondition == "ARTIFACT_ALREADY_EXISTS" =>
+ failedArtifactExceptions += e
}
artifact.summary()
}.toSeq
+
+ if (failedArtifactExceptions.nonEmpty) {
+ throw ArtifactUtils.mergeExceptionsWithSuppressed(failedArtifactExceptions.toSeq)
+ }
+
+ summaries
}
protected def cleanUpStagedArtifacts(): Unit = Utils.deleteRecursively(stagingDir.toFile)
@@ -216,6 +230,7 @@ class SparkConnectAddArtifactsHandler(val responseObserver: StreamObserver[AddAr
private val fileOut = Files.newOutputStream(stagedPath)
private val countingOut = new CountingOutputStream(fileOut)
private val checksumOut = new CheckedOutputStream(countingOut, new CRC32)
+ private val overallChecksum = new CRC32()
private val builder = ArtifactSummary.newBuilder().setName(name)
private var artifactSummary: ArtifactSummary = _
@@ -227,6 +242,8 @@ class SparkConnectAddArtifactsHandler(val responseObserver: StreamObserver[AddAr
def getCrcStatus: Option[Boolean] = Option(isCrcSuccess)
+ def getCrc: Long = overallChecksum.getValue
+
def write(dataChunk: proto.AddArtifactsRequest.ArtifactChunk): Unit = {
try dataChunk.getData.writeTo(checksumOut)
catch {
@@ -234,6 +251,8 @@ class SparkConnectAddArtifactsHandler(val responseObserver: StreamObserver[AddAr
close()
throw e
}
+
+ overallChecksum.update(dataChunk.getData.toByteArray)
updateCrc(checksumOut.getChecksum.getValue == dataChunk.getCrc)
checksumOut.getChecksum.reset()
}
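The artifact-handler change above keeps two checksums per staged artifact: the existing per-chunk CRC, which is compared against the client-provided value and then reset, and a new `CRC32` that accumulates across all chunks and is exposed via `getCrc`. A self-contained sketch of that bookkeeping (the chunk payloads here are made up):

```scala
import java.util.zip.CRC32

// Sketch only: illustrates per-chunk vs. overall CRC accumulation.
object CrcSketch {
  def main(args: Array[String]): Unit = {
    val overall = new CRC32()
    val chunks = Seq("part-one".getBytes("UTF-8"), "part-two".getBytes("UTF-8"))

    chunks.foreach { bytes =>
      val perChunk = new CRC32()
      perChunk.update(bytes)
      // In the handler, this per-chunk value is checked against the CRC sent by the client.
      println(s"chunk crc = ${perChunk.getValue}")
      overall.update(bytes) // running checksum over the whole artifact
    }
    println(s"overall crc = ${overall.getValue}")
  }
}
```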
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectExecutionManager.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectExecutionManager.scala
index c8f4a1bc977f8..35c4073fe93c9 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectExecutionManager.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectExecutionManager.scala
@@ -30,7 +30,7 @@ import io.grpc.stub.StreamObserver
import org.apache.spark.{SparkEnv, SparkSQLException}
import org.apache.spark.connect.proto
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.catalyst.util.DateTimeConstants.NANOS_PER_MILLIS
import org.apache.spark.sql.connect.config.Connect.{CONNECT_EXECUTE_MANAGER_ABANDONED_TOMBSTONES_SIZE, CONNECT_EXECUTE_MANAGER_DETACHED_TIMEOUT, CONNECT_EXECUTE_MANAGER_MAINTENANCE_INTERVAL}
import org.apache.spark.sql.connect.execution.ExecuteGrpcResponseSender
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectListenerBusListener.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectListenerBusListener.scala
index 8fbcf3218a003..91fe395f520d8 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectListenerBusListener.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectListenerBusListener.scala
@@ -29,7 +29,7 @@ import org.apache.spark.connect.proto.ExecutePlanResponse
import org.apache.spark.connect.proto.StreamingQueryEventType
import org.apache.spark.connect.proto.StreamingQueryListenerEvent
import org.apache.spark.connect.proto.StreamingQueryListenerEventsResult
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.connect.execution.ExecuteResponseObserver
import org.apache.spark.sql.streaming.StreamingQueryListener
import org.apache.spark.util.ArrayImplicits._
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectServer.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectServer.scala
index b2c4d1abb17b4..5b1034a4a27b7 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectServer.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectServer.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.connect.service
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{HOST, PORT}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.internal.SQLConf
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectService.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectService.scala
index 262cc954f8f9d..cc1cb95b66c46 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectService.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectService.scala
@@ -29,13 +29,12 @@ import io.grpc.netty.NettyServerBuilder
import io.grpc.protobuf.ProtoUtils
import io.grpc.protobuf.services.ProtoReflectionService
import io.grpc.stub.StreamObserver
-import org.apache.commons.lang3.StringUtils
import org.apache.spark.{SparkContext, SparkEnv}
import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.{AddArtifactsRequest, AddArtifactsResponse, SparkConnectServiceGrpc}
import org.apache.spark.connect.proto.SparkConnectServiceGrpc.AsyncService
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.HOST
import org.apache.spark.internal.config.UI.UI_ENABLED
import org.apache.spark.scheduler.{LiveListenerBus, SparkListenerEvent}
@@ -504,7 +503,7 @@ object SparkConnectService extends Logging {
}
def extractErrorMessage(st: Throwable): String = {
- val message = StringUtils.abbreviate(st.getMessage, 2048)
+ val message = Utils.abbreviate(st.getMessage, 2048)
convertNullString(message)
}
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectSessionManager.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectSessionManager.scala
index 572d760187e9d..1c3cfd67f132c 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectSessionManager.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectSessionManager.scala
@@ -28,7 +28,7 @@ import scala.util.control.NonFatal
import com.google.common.cache.CacheBuilder
import org.apache.spark.{SparkEnv, SparkSQLException}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{INTERVAL, SESSION_HOLD_INFO}
import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.connect.config.Connect.{CONNECT_SESSION_MANAGER_CLOSED_SESSIONS_TOMBSTONES_SIZE, CONNECT_SESSION_MANAGER_DEFAULT_SESSION_TIMEOUT, CONNECT_SESSION_MANAGER_MAINTENANCE_INTERVAL}
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectStreamingQueryCache.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectStreamingQueryCache.scala
index beff193f6701f..8ff13f5afe191 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectStreamingQueryCache.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/service/SparkConnectStreamingQueryCache.scala
@@ -25,7 +25,7 @@ import scala.concurrent.{ExecutionContext, Future}
import scala.concurrent.duration.{Duration, DurationInt, FiniteDuration}
import scala.util.control.NonFatal
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{DURATION, NEW_VALUE, OLD_VALUE, QUERY_CACHE_VALUE, QUERY_ID, QUERY_RUN_ID, SESSION_ID}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.streaming.StreamingQuery
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ui/SparkConnectServerListener.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ui/SparkConnectServerListener.scala
index 3a93bbae3f2b8..98dccc6c9a6c8 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ui/SparkConnectServerListener.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/ui/SparkConnectServerListener.scala
@@ -23,7 +23,7 @@ import scala.collection.mutable
import scala.collection.mutable.ArrayBuffer
import org.apache.spark.{SparkConf, SparkContext, SparkEnv}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{OP_ID, SESSION_ID}
import org.apache.spark.internal.config.Status.LIVE_ENTITY_UPDATE_PERIOD
import org.apache.spark.scheduler._
diff --git a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/utils/ErrorUtils.scala b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/utils/ErrorUtils.scala
index 837d4a4d3ee78..76f91ee710590 100644
--- a/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/utils/ErrorUtils.scala
+++ b/sql/connect/server/src/main/scala/org/apache/spark/sql/connect/utils/ErrorUtils.scala
@@ -30,20 +30,19 @@ import com.google.rpc.{Code => RPCCode, ErrorInfo, Status => RPCStatus}
import io.grpc.Status
import io.grpc.protobuf.StatusProto
import io.grpc.stub.StreamObserver
-import org.apache.commons.lang3.StringUtils
-import org.apache.commons.lang3.exception.ExceptionUtils
import org.json4s.JsonDSL._
import org.json4s.jackson.JsonMethods
import org.apache.spark.{QueryContextType, SparkEnv, SparkException, SparkThrowable}
import org.apache.spark.api.python.PythonException
import org.apache.spark.connect.proto.FetchErrorDetailsResponse
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{OP_TYPE, SESSION_ID, USER_ID}
import org.apache.spark.sql.connect.config.Connect
import org.apache.spark.sql.connect.service.{ExecuteEventsManager, SessionHolder, SessionKey, SparkConnectService}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.Utils
private[connect] object ErrorUtils extends Logging {
@@ -217,7 +216,7 @@ private[connect] object ErrorUtils extends Logging {
.put(errorId, st)
}
- lazy val stackTrace = Option(ExceptionUtils.getStackTrace(st))
+ lazy val stackTrace = Option(Utils.stackTraceToString(st))
val stackTraceEnabled = sessionHolderOpt.exists(
_.session.sessionState.conf.getConf(SQLConf.PYSPARK_JVM_STACKTRACE_ENABLED))
val withStackTrace =
@@ -225,7 +224,7 @@ private[connect] object ErrorUtils extends Logging {
val maxSize = Math.min(
SparkEnv.get.conf.get(Connect.CONNECT_JVM_STACK_TRACE_MAX_SIZE),
maxMetadataSize)
- errorInfo.putMetadata("stackTrace", StringUtils.abbreviate(stackTrace.get, maxSize.toInt))
+ errorInfo.putMetadata("stackTrace", Utils.abbreviate(stackTrace.get, maxSize.toInt))
} else {
errorInfo
}
@@ -297,7 +296,7 @@ private[connect] object ErrorUtils extends Logging {
e,
Status.UNKNOWN
.withCause(e)
- .withDescription(StringUtils.abbreviate(e.getMessage, 2048))
+ .withDescription(Utils.abbreviate(e.getMessage, 2048))
.asRuntimeException())
}
partial
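The `ErrorUtils` changes above swap the Commons Lang helpers for Spark's own `Utils.stackTraceToString` and `Utils.abbreviate`. As a rough illustration only, assuming abbreviate-style semantics (truncate to a maximum length and end with an ellipsis, as the replaced `StringUtils.abbreviate` does); the sketch below is not the actual `Utils` implementation:

```scala
// Sketch only: hypothetical abbreviate helper, not org.apache.spark.util.Utils.
object AbbreviateSketch {
  def abbreviate(s: String, maxLen: Int): String =
    if (s == null || s.length <= maxLen) s
    else s.take(math.max(0, maxLen - 3)) + "..."

  def main(args: Array[String]): Unit = {
    // Truncate a long stack trace before attaching it to error metadata.
    val stackTrace = new RuntimeException("boom").getStackTrace.mkString("\n")
    println(abbreviate(stackTrace, 128))
  }
}
```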
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/ProtoToParsedPlanTestSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/ProtoToParsedPlanTestSuite.scala
index 29ad97ad9fbe8..02c5683e02765 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/ProtoToParsedPlanTestSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/ProtoToParsedPlanTestSuite.scala
@@ -27,7 +27,6 @@ import scala.util.{Failure, Success, Try}
import org.apache.spark.{SparkConf, SparkFunSuite}
import org.apache.spark.connect.proto
import org.apache.spark.internal.LogKeys.PATH
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.{catalog, QueryPlanningTracker}
import org.apache.spark.sql.catalyst.analysis.{caseSensitiveResolution, Analyzer, FunctionRegistry, Resolver, TableFunctionRegistry}
import org.apache.spark.sql.catalyst.catalog.SessionCatalog
@@ -38,6 +37,7 @@ import org.apache.spark.sql.connect.config.Connect
import org.apache.spark.sql.connect.planner.SparkConnectPlanner
import org.apache.spark.sql.connector.catalog.{CatalogManager, Column, Identifier, InMemoryCatalog}
import org.apache.spark.sql.connector.expressions.Transform
+import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.test.SharedSparkSession
import org.apache.spark.sql.types.LongType
import org.apache.spark.sql.util.CaseInsensitiveStringMap
@@ -198,7 +198,9 @@ class ProtoToParsedPlanTestSuite
}
Helper.execute(catalystPlan)
}
- val actual = removeMemoryAddress(normalizeExprIds(finalAnalyzedPlan).treeString)
+ val actual = withSQLConf(SQLConf.MAX_TO_STRING_FIELDS.key -> Int.MaxValue.toString) {
+ removeMemoryAddress(normalizeExprIds(finalAnalyzedPlan).treeString)
+ }
val goldenFile = goldenFilePath.resolve(relativePath).getParent.resolve(name + ".explain")
Try(readGoldenFile(goldenFile)) match {
case Success(expected) if expected == actual => // Test passes.
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/messages/AbbreviateSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/messages/AbbreviateSuite.scala
index 94d92a264d20c..41271a874cc8d 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/messages/AbbreviateSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/messages/AbbreviateSuite.scala
@@ -27,7 +27,7 @@ import org.apache.spark.sql.connect.common.{ProtoDataTypes, ProtoUtils}
class AbbreviateSuite extends SparkFunSuite {
test("truncate string: simple SQL text") {
- val message = proto.SQL.newBuilder().setQuery("x" * 1024).build()
+ val message = proto.SQL.newBuilder().setQuery("x".repeat(1024)).build()
Seq(1, 16, 256, 512, 1024, 2048).foreach { threshold =>
val truncated = ProtoUtils.abbreviate(message, threshold)
@@ -47,7 +47,7 @@ class AbbreviateSuite extends SparkFunSuite {
.setSql(
proto.SQL
.newBuilder()
- .setQuery("x" * 1024)
+ .setQuery("x".repeat(1024))
.build())
.build()
val drop = proto.Relation
@@ -214,7 +214,10 @@ class AbbreviateSuite extends SparkFunSuite {
test("truncate map") {
val read = proto.Read.NamedTable
.newBuilder()
- .putAllOptions(Map("k1" * 4096 -> "v1" * 4096, "k2" * 4096 -> "v2" * 4096).asJava)
+ .putAllOptions(
+ Map(
+ "k1".repeat(4096) -> "v1".repeat(4096),
+ "k2".repeat(4096) -> "v2".repeat(4096)).asJava)
.build()
val threshold = 1024
@@ -237,14 +240,14 @@ class AbbreviateSuite extends SparkFunSuite {
.newBuilder()
.setUnresolvedAttribute(proto.Expression.UnresolvedAttribute
.newBuilder()
- .setUnparsedIdentifier("v1" * 4096)
+ .setUnparsedIdentifier("v1".repeat(4096))
.build())
.build(),
"k2" -> proto.Expression
.newBuilder()
.setUnresolvedAttribute(proto.Expression.UnresolvedAttribute
.newBuilder()
- .setUnparsedIdentifier("v2" * 4096)
+ .setUnparsedIdentifier("v2".repeat(4096))
.build())
.build()).asJava)
.build()
@@ -272,7 +275,7 @@ class AbbreviateSuite extends SparkFunSuite {
.newBuilder()
.setQuery(
// Level 5.
- "x" * (threshold + 32))
+ "x".repeat(threshold + 32))
.build())
.build()
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineEventStreamSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineEventStreamSuite.scala
index 100aa2e3b63a7..83862545a723e 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineEventStreamSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineEventStreamSuite.scala
@@ -70,14 +70,67 @@ class PipelineEventStreamSuite extends SparkDeclarativePipelinesServerTest {
}
}
- test("check error events from stream") {
+ test("flow resolution failure") {
+ val dryOptions = Seq(true, false)
+
+ dryOptions.foreach { dry =>
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = new TestPipelineDefinition(graphId) {
+ createTable(
+ name = "a",
+ datasetType = proto.DatasetType.MATERIALIZED_VIEW,
+ sql = Some("SELECT * FROM unknown_table"))
+ createTable(
+ name = "b",
+ datasetType = proto.DatasetType.TABLE,
+ sql = Some("SELECT * FROM STREAM a"))
+ }
+ registerPipelineDatasets(pipeline)
+
+ val capturedEvents = new ArrayBuffer[PipelineEvent]()
+ withClient { client =>
+ val startRunRequest = buildStartRunPlan(
+ proto.PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setDry(dry)
+ .build())
+ val ex = intercept[AnalysisException] {
+ val responseIterator = client.execute(startRunRequest)
+ while (responseIterator.hasNext) {
+ val response = responseIterator.next()
+ if (response.hasPipelineEventResult) {
+ capturedEvents.append(response.getPipelineEventResult.getEvent)
+ }
+ }
+ }
+ // (?s) enables DOTALL mode so that '.' also matches newline characters
+ val runFailureErrorMsg = "(?s).*Failed to resolve flows in the pipeline.*".r
+ assert(runFailureErrorMsg.matches(ex.getMessage))
+ val expectedLogPatterns = Set(
+ "(?s).*Failed to resolve flow.*Failed to read dataset 'spark_catalog.default.a'.*".r,
+ "(?s).*Failed to resolve flow.*[TABLE_OR_VIEW_NOT_FOUND].*".r)
+ expectedLogPatterns.foreach { logPattern =>
+ assert(
+ capturedEvents.exists(e => logPattern.matches(e.getMessage)),
+ s"Did not receive expected event matching pattern: $logPattern")
+ }
+ // Ensure that the error causing the run failure is not surfaced to the user twice
+ assert(capturedEvents.forall(e => !runFailureErrorMsg.matches(e.getMessage)))
+ }
+ }
+ }
+ }
+
+ test("successful dry run") {
withRawBlockingStub { implicit stub =>
val graphId = createDataflowGraph
val pipeline = new TestPipelineDefinition(graphId) {
createTable(
name = "a",
datasetType = proto.DatasetType.MATERIALIZED_VIEW,
- sql = Some("SELECT * FROM unknown_table"))
+ sql = Some("SELECT * FROM RANGE(5)"))
createTable(
name = "b",
datasetType = proto.DatasetType.TABLE,
@@ -88,29 +141,29 @@ class PipelineEventStreamSuite extends SparkDeclarativePipelinesServerTest {
val capturedEvents = new ArrayBuffer[PipelineEvent]()
withClient { client =>
val startRunRequest = buildStartRunPlan(
- proto.PipelineCommand.StartRun.newBuilder().setDataflowGraphId(graphId).build())
- val ex = intercept[AnalysisException] {
- val responseIterator = client.execute(startRunRequest)
- while (responseIterator.hasNext) {
- val response = responseIterator.next()
- if (response.hasPipelineEventResult) {
- capturedEvents.append(response.getPipelineEventResult.getEvent)
- }
+ proto.PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setDry(true)
+ .build())
+ val responseIterator = client.execute(startRunRequest)
+ while (responseIterator.hasNext) {
+ val response = responseIterator.next()
+ if (response.hasPipelineEventResult) {
+ capturedEvents.append(response.getPipelineEventResult.getEvent)
}
}
- // (?s) enables wildcard matching on newline characters
- val runFailureErrorMsg = "(?s).*Failed to resolve flows in the pipeline.*".r
- assert(runFailureErrorMsg.matches(ex.getMessage))
- val expectedLogPatterns = Set(
- "(?s).*Failed to resolve flow.*Failed to read dataset 'spark_catalog.default.a'.*".r,
- "(?s).*Failed to resolve flow.*[TABLE_OR_VIEW_NOT_FOUND].*".r)
- expectedLogPatterns.foreach { logPattern =>
+ val expectedEventMessages = Set("Run is COMPLETED")
+ expectedEventMessages.foreach { eventMessage =>
assert(
- capturedEvents.exists(e => logPattern.matches(e.getMessage)),
- s"Did not receive expected event matching pattern: $logPattern")
+ capturedEvents.exists(e => e.getMessage.contains(eventMessage)),
+ s"Did not receive expected event: $eventMessage")
}
- // Ensure that the error causing the run failure is not surfaced to the user twice
- assert(capturedEvents.forall(e => !runFailureErrorMsg.matches(e.getMessage)))
+ }
+
+ // No flows should be started in dry run mode
+ capturedEvents.foreach { event =>
+ assert(!event.getMessage.contains("is QUEUED"))
}
}
}
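The assertions in the pipeline event tests above rely on the `(?s)` inline flag so that `.` also matches newlines when patterns are applied to multi-line error messages. A tiny standalone example of the difference (the message text is made up):

```scala
// Sketch only: shows why the tests prefix their patterns with (?s).
object DotAllRegexSketch {
  def main(args: Array[String]): Unit = {
    val message = "Run failed:\nFailed to resolve flows in the pipeline.\nSee logs."
    val withoutFlag = ".*Failed to resolve flows.*".r
    val withFlag = "(?s).*Failed to resolve flows.*".r
    println(withoutFlag.matches(message)) // false: '.' stops at newlines
    println(withFlag.matches(message))    // true: '.' spans newlines
  }
}
```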
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineRefreshFunctionalSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineRefreshFunctionalSuite.scala
new file mode 100644
index 0000000000000..794932544d5f9
--- /dev/null
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PipelineRefreshFunctionalSuite.scala
@@ -0,0 +1,353 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.connect.pipelines
+
+import scala.collection.mutable.ArrayBuffer
+import scala.jdk.CollectionConverters._
+
+import org.apache.spark.connect.proto.{DatasetType, PipelineCommand, PipelineEvent}
+import org.apache.spark.sql.QueryTest
+import org.apache.spark.sql.catalyst.TableIdentifier
+import org.apache.spark.sql.connect.service.{SessionKey, SparkConnectService}
+import org.apache.spark.sql.pipelines.utils.{EventVerificationTestHelpers, TestPipelineUpdateContextMixin}
+
+/**
+ * Comprehensive test suite that validates pipeline refresh functionality by running actual
+ * pipelines with different refresh parameters and checking the resulting table contents.
+ */
+class PipelineRefreshFunctionalSuite
+ extends SparkDeclarativePipelinesServerTest
+ with TestPipelineUpdateContextMixin
+ with EventVerificationTestHelpers {
+
+ private val externalSourceTable = TableIdentifier(
+ catalog = Some("spark_catalog"),
+ database = Some("default"),
+ table = "source_data")
+
+ override def beforeEach(): Unit = {
+ super.beforeEach()
+ // Create source table to simulate streaming updates
+ spark.sql(s"CREATE TABLE $externalSourceTable AS SELECT * FROM RANGE(1, 2)")
+ }
+
+ override def afterEach(): Unit = {
+ super.afterEach()
+ // Clean up the source table after each test
+ spark.sql(s"DROP TABLE IF EXISTS $externalSourceTable")
+ }
+
+ private def createTestPipeline(graphId: String): TestPipelineDefinition = {
+ new TestPipelineDefinition(graphId) {
+ // Create tables that depend on the mv
+ createTable(
+ name = "a",
+ datasetType = DatasetType.TABLE,
+ sql = Some(s"SELECT id FROM STREAM $externalSourceTable"))
+ createTable(
+ name = "b",
+ datasetType = DatasetType.TABLE,
+ sql = Some(s"SELECT id FROM STREAM $externalSourceTable"))
+ createTable(
+ name = "mv",
+ datasetType = DatasetType.MATERIALIZED_VIEW,
+ sql = Some(s"SELECT id FROM a"))
+ }
+ }
+
+ /**
+ * Helper method to run refresh tests with common setup and verification logic. This reduces
+ * code duplication across the refresh test cases.
+ */
+ private def runRefreshTest(
+ refreshConfigBuilder: String => Option[PipelineCommand.StartRun] = _ => None,
+ expectedContentAfterRefresh: Map[String, Set[Map[String, Any]]],
+ eventValidation: Option[ArrayBuffer[PipelineEvent] => Unit] = None): Unit = {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = createTestPipeline(graphId)
+ registerPipelineDatasets(pipeline)
+
+ // First run to populate tables
+ startPipelineAndWaitForCompletion(graphId)
+
+ // Expected initial content of each table, collected into a map for verification
+ val initialContent = Map(
+ "spark_catalog.default.a" -> Set(Map("id" -> 1)),
+ "spark_catalog.default.b" -> Set(Map("id" -> 1)),
+ "spark_catalog.default.mv" -> Set(Map("id" -> 1)))
+ // Verify initial content
+ initialContent.foreach { case (tableName, expectedRows) =>
+ checkTableContent(tableName, expectedRows)
+ }
+ // Clear cached pipeline execution before starting new run
+ SparkConnectService.sessionManager
+ .getIsolatedSessionIfPresent(SessionKey(defaultUserId, defaultSessionId))
+ .foreach(_.removeAllPipelineExecutions())
+
+ // Replace source data to simulate a streaming update
+ spark.sql(
+ "INSERT OVERWRITE TABLE spark_catalog.default.source_data " +
+ "SELECT * FROM VALUES (2), (3) AS t(id)")
+
+ // Run with specified refresh configuration
+ val capturedEvents = refreshConfigBuilder(graphId) match {
+ case Some(startRun) => startPipelineAndWaitForCompletion(startRun)
+ case None => startPipelineAndWaitForCompletion(graphId)
+ }
+
+ // Additional validation if provided
+ eventValidation.foreach(_(capturedEvents))
+
+ // Verify final content with checkTableContent
+ expectedContentAfterRefresh.foreach { case (tableName, expectedRows) =>
+ checkTableContent(tableName, expectedRows)
+ }
+ }
+ }
+
+ test("pipeline runs selective full_refresh") {
+ runRefreshTest(
+ refreshConfigBuilder = { graphId =>
+ Some(
+ PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .addAllFullRefreshSelection(List("a").asJava)
+ .build())
+ },
+ expectedContentAfterRefresh = Map(
+ "spark_catalog.default.a" -> Set(
+ Map("id" -> 2), // a is fully refreshed and only contains the new values
+ Map("id" -> 3)),
+ "spark_catalog.default.b" -> Set(
+ Map("id" -> 1) // b is not refreshed, so it retains the old value
+ ),
+ "spark_catalog.default.mv" -> Set(
+ Map("id" -> 1) // mv is not refreshed, so it retains the old value
+ )),
+ eventValidation = Some { capturedEvents =>
+ // assert that the flow for table 'b' is excluded
+ assert(
+ capturedEvents.exists(
+ _.getMessage.contains(s"Flow \'spark_catalog.default.b\' is EXCLUDED.")))
+ // assert that the flow for table 'a' ran to completion
+ assert(
+ capturedEvents.exists(
+ _.getMessage.contains(s"Flow spark_catalog.default.a has COMPLETED.")))
+ // assert that mv is excluded
+ assert(
+ capturedEvents.exists(
+ _.getMessage.contains(s"Flow \'spark_catalog.default.mv\' is EXCLUDED.")))
+ // Verify completion event
+ assert(capturedEvents.exists(_.getMessage.contains("Run is COMPLETED")))
+ })
+ }
+
+ test("pipeline runs selective full_refresh and selective refresh") {
+ runRefreshTest(
+ refreshConfigBuilder = { graphId =>
+ Some(
+ PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .addAllFullRefreshSelection(Seq("a", "mv").asJava)
+ .addRefreshSelection("b")
+ .build())
+ },
+ expectedContentAfterRefresh = Map(
+ "spark_catalog.default.a" -> Set(
+ Map("id" -> 2), // a is fully refreshed and only contains the new values
+ Map("id" -> 3)),
+ "spark_catalog.default.b" -> Set(
+ Map("id" -> 1), // b is refreshed, so it retains the old value and adds the new ones
+ Map("id" -> 2),
+ Map("id" -> 3)),
+ "spark_catalog.default.mv" -> Set(
+ Map("id" -> 2), // mv is fully refreshed and only contains the new values
+ Map("id" -> 3))))
+ }
+
+ test("pipeline runs refresh by default") {
+ runRefreshTest(expectedContentAfterRefresh =
+ Map(
+ "spark_catalog.default.a" -> Set(
+ Map(
+ "id" -> 1
+ ), // a is refreshed by default, retains the old value and adds the new ones
+ Map("id" -> 2),
+ Map("id" -> 3)),
+ "spark_catalog.default.b" -> Set(
+ Map(
+ "id" -> 1
+ ), // b is refreshed by default, retains the old value and adds the new ones
+ Map("id" -> 2),
+ Map("id" -> 3)),
+ "spark_catalog.default.mv" -> Set(
+ Map("id" -> 1),
+ Map("id" -> 2), // mv is refreshed from table a, retains all values
+ Map("id" -> 3))))
+ }
+
+ test("pipeline runs full refresh all") {
+ runRefreshTest(
+ refreshConfigBuilder = { graphId =>
+ Some(
+ PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setFullRefreshAll(true)
+ .build())
+ },
+ // full refresh all causes all tables to lose the initial value
+ // and only contain the new values after the source data is updated
+ expectedContentAfterRefresh = Map(
+ "spark_catalog.default.a" -> Set(Map("id" -> 2), Map("id" -> 3)),
+ "spark_catalog.default.b" -> Set(Map("id" -> 2), Map("id" -> 3)),
+ "spark_catalog.default.mv" -> Set(Map("id" -> 2), Map("id" -> 3))))
+ }
+
+ test("validation: cannot specify subset refresh when full_refresh_all is true") {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = createTestPipeline(graphId)
+ registerPipelineDatasets(pipeline)
+
+ val startRun = PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setFullRefreshAll(true)
+ .addRefreshSelection("a")
+ .build()
+
+ val exception = intercept[IllegalArgumentException] {
+ startPipelineAndWaitForCompletion(startRun)
+ }
+ assert(
+ exception.getMessage.contains(
+ "Cannot specify a subset to refresh when full refresh all is set to true"))
+ }
+ }
+
+ test("validation: cannot specify subset full_refresh when full_refresh_all is true") {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = createTestPipeline(graphId)
+ registerPipelineDatasets(pipeline)
+
+ val startRun = PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setFullRefreshAll(true)
+ .addFullRefreshSelection("a")
+ .build()
+
+ val exception = intercept[IllegalArgumentException] {
+ startPipelineAndWaitForCompletion(startRun)
+ }
+ assert(
+ exception.getMessage.contains(
+ "Cannot specify a subset to full refresh when full refresh all is set to true"))
+ }
+ }
+
+ test("validation: refresh and full_refresh cannot overlap") {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = createTestPipeline(graphId)
+ registerPipelineDatasets(pipeline)
+
+ val startRun = PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .addRefreshSelection("a")
+ .addFullRefreshSelection("a")
+ .build()
+
+ val exception = intercept[IllegalArgumentException] {
+ startPipelineAndWaitForCompletion(startRun)
+ }
+ assert(
+ exception.getMessage.contains(
+ "Datasets specified for refresh and full refresh cannot overlap"))
+ assert(exception.getMessage.contains("a"))
+ }
+ }
+
+ test("validation: multiple overlapping tables in refresh and full_refresh not allowed") {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = createTestPipeline(graphId)
+ registerPipelineDatasets(pipeline)
+
+ val startRun = PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .addRefreshSelection("a")
+ .addRefreshSelection("b")
+ .addFullRefreshSelection("a")
+ .build()
+
+ val exception = intercept[IllegalArgumentException] {
+ startPipelineAndWaitForCompletion(startRun)
+ }
+ assert(
+ exception.getMessage.contains(
+ "Datasets specified for refresh and full refresh cannot overlap"))
+ assert(exception.getMessage.contains("a"))
+ }
+ }
+
+ test("validation: fully qualified table names in validation") {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+ val pipeline = createTestPipeline(graphId)
+ registerPipelineDatasets(pipeline)
+
+ val startRun = PipelineCommand.StartRun
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .addRefreshSelection("spark_catalog.default.a")
+ .addFullRefreshSelection("a") // This should be treated as the same table
+ .build()
+
+ val exception = intercept[IllegalArgumentException] {
+ startPipelineAndWaitForCompletion(startRun)
+ }
+ assert(
+ exception.getMessage.contains(
+ "Datasets specified for refresh and full refresh cannot overlap"))
+ }
+ }
+
+ private def checkTableContent[A <: Map[String, Any]](
+ name: String,
+ expectedContent: Set[A]): Unit = {
+ spark.catalog.refreshTable(name) // clear cache for the table
+ val df = spark.table(name)
+ QueryTest.checkAnswer(
+ df,
+ expectedContent
+ .map(row => {
+ // Convert each row to a Row object
+ org.apache.spark.sql.Row.fromSeq(row.values.toSeq)
+ })
+ .toSeq
+ .asJava)
+ }
+}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PythonPipelineSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PythonPipelineSuite.scala
index 21f2857090182..0895463037f2a 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PythonPipelineSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/PythonPipelineSuite.scala
@@ -20,6 +20,7 @@ package org.apache.spark.sql.connect.pipelines
import java.io.{BufferedReader, InputStreamReader}
import java.nio.charset.StandardCharsets
import java.nio.file.Paths
+import java.util.UUID
import java.util.concurrent.TimeUnit
import scala.collection.mutable.ArrayBuffer
@@ -28,7 +29,8 @@ import scala.util.Try
import org.apache.spark.api.python.PythonUtils
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.TableIdentifier
-import org.apache.spark.sql.pipelines.graph.DataflowGraph
+import org.apache.spark.sql.connect.service.SparkConnectService
+import org.apache.spark.sql.pipelines.graph.{DataflowGraph, PipelineUpdateContextImpl}
import org.apache.spark.sql.pipelines.utils.{EventVerificationTestHelpers, TestPipelineUpdateContextMixin}
/**
@@ -42,10 +44,12 @@ class PythonPipelineSuite
def buildGraph(pythonText: String): DataflowGraph = {
val indentedPythonText = pythonText.linesIterator.map(" " + _).mkString("\n")
+ // Create a unique identifier so the session and its dataflow graph can be identified later
+ val customSessionIdentifier = UUID.randomUUID().toString
val pythonCode =
s"""
|from pyspark.sql import SparkSession
- |from pyspark import pipelines as sdp
+ |from pyspark import pipelines as dp
|from pyspark.pipelines.spark_connect_graph_element_registry import (
| SparkConnectGraphElementRegistry,
|)
@@ -57,6 +61,7 @@ class PythonPipelineSuite
|spark = SparkSession.builder \\
| .remote("sc://localhost:$serverPort") \\
| .config("spark.connect.grpc.channel.timeout", "5s") \\
+ | .config("spark.custom.identifier", "$customSessionIdentifier") \\
| .create()
|
|dataflow_graph_id = create_dataflow_graph(
@@ -78,8 +83,17 @@ class PythonPipelineSuite
throw new RuntimeException(
s"Python process failed with exit code $exitCode. Output: ${output.mkString("\n")}")
}
+ val activeSessions = SparkConnectService.sessionManager.listActiveSessions
- val dataflowGraphContexts = DataflowGraphRegistry.getAllDataflowGraphs
+ // get the session holder by finding the session with the custom UUID set in the conf
+ val sessionHolder = activeSessions
+ .map(info => SparkConnectService.sessionManager.getIsolatedSession(info.key, None))
+ .find(_.session.conf.get("spark.custom.identifier") == customSessionIdentifier)
+ .getOrElse(
+ throw new RuntimeException(s"Session with identifier $customSessionIdentifier not found"))
+
+ // get all dataflow graphs from the session holder
+ val dataflowGraphContexts = sessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
assert(dataflowGraphContexts.size == 1)
dataflowGraphContexts.head.toDataflowGraph
@@ -91,9 +105,9 @@ class PythonPipelineSuite
test("basic") {
val graph = buildGraph("""
- |@sdp.table
+ |@dp.table
|def table1():
- | return spark.range(10)
+ | return spark.readStream.format("rate").load()
|""".stripMargin)
.resolve()
.validate()
@@ -104,19 +118,19 @@ class PythonPipelineSuite
test("basic with inverted topological order") {
// This graph is purposefully in the wrong topological order to test the topological sort
val graph = buildGraph("""
- |@sdp.table()
+ |@dp.table()
|def b():
| return spark.readStream.table("a")
|
- |@sdp.table()
+ |@dp.table()
|def c():
| return spark.readStream.table("a")
|
- |@sdp.table()
+ |@dp.materialized_view()
|def d():
| return spark.read.table("a")
|
- |@sdp.table()
+ |@dp.materialized_view()
|def a():
| return spark.range(5)
|""".stripMargin)
@@ -127,11 +141,11 @@ class PythonPipelineSuite
test("flows") {
val graph = buildGraph("""
- |@sdp.table()
+ |@dp.table()
|def a():
| return spark.readStream.format("rate").load()
|
- |@sdp.append_flow(target = "a")
+ |@dp.append_flow(target = "a")
|def supplement():
| return spark.readStream.format("rate").load()
|""".stripMargin).resolve().validate()
@@ -146,15 +160,15 @@ class PythonPipelineSuite
test("referencing internal datasets") {
val graph = buildGraph("""
- |@sdp.materialized_view
+ |@dp.materialized_view
|def src():
| return spark.range(5)
|
- |@sdp.materialized_view
+ |@dp.materialized_view
|def a():
| return spark.read.table("src")
|
- |@sdp.table
+ |@dp.table
|def b():
| return spark.readStream.table("src")
|""".stripMargin).resolve().validate()
@@ -177,15 +191,15 @@ class PythonPipelineSuite
test("referencing external datasets") {
sql("CREATE TABLE spark_catalog.default.src AS SELECT * FROM RANGE(5)")
val graph = buildGraph("""
- |@sdp.table
+ |@dp.materialized_view
|def a():
| return spark.read.table("spark_catalog.default.src")
|
- |@sdp.table
+ |@dp.materialized_view
|def b():
| return spark.table("spark_catalog.default.src")
|
- |@sdp.table
+ |@dp.table
|def c():
| return spark.readStream.table("spark_catalog.default.src")
|""".stripMargin).resolve().validate()
@@ -204,15 +218,15 @@ class PythonPipelineSuite
test("referencing internal datasets failed") {
val graph = buildGraph("""
- |@sdp.table
+ |@dp.table
|def a():
| return spark.read.table("src")
|
- |@sdp.table
+ |@dp.table
|def b():
| return spark.table("src")
|
- |@sdp.table
+ |@dp.table
|def c():
| return spark.readStream.table("src")
|""".stripMargin).resolve()
@@ -226,15 +240,15 @@ class PythonPipelineSuite
test("referencing external datasets failed") {
val graph = buildGraph("""
- |@sdp.table
+ |@dp.table
|def a():
| return spark.read.table("spark_catalog.default.src")
|
- |@sdp.table
+ |@dp.materialized_view
|def b():
| return spark.table("spark_catalog.default.src")
|
- |@sdp.table
+ |@dp.materialized_view
|def c():
| return spark.readStream.table("spark_catalog.default.src")
|""".stripMargin).resolve()
@@ -246,11 +260,11 @@ class PythonPipelineSuite
test("create dataset with the same name will fail") {
val ex = intercept[AnalysisException] {
buildGraph(s"""
- |@sdp.materialized_view
+ |@dp.materialized_view
|def a():
| return spark.range(1)
|
- |@sdp.materialized_view(name = "a")
+ |@dp.materialized_view(name = "a")
|def b():
| return spark.range(1)
|""".stripMargin)
@@ -260,19 +274,19 @@ class PythonPipelineSuite
test("create datasets with fully/partially qualified names") {
val graph = buildGraph(s"""
- |@sdp.table
+ |@dp.table
|def mv_1():
| return spark.range(5)
|
- |@sdp.table(name = "schema_a.mv_2")
+ |@dp.table(name = "schema_a.mv_2")
|def irrelevant_1():
| return spark.range(5)
|
- |@sdp.table(name = "st_1")
+ |@dp.table(name = "st_1")
|def irrelevant_2():
| return spark.readStream.format("rate").load()
|
- |@sdp.table(name = "schema_b.st_2")
+ |@dp.table(name = "schema_b.st_2")
|def irrelevant_3():
| return spark.readStream.format("rate").load()
|""".stripMargin).resolve()
@@ -319,11 +333,11 @@ class PythonPipelineSuite
test("create datasets with three part names") {
val graphTry = Try {
buildGraph(s"""
- |@sdp.table(name = "some_catalog.some_schema.mv")
+ |@dp.table(name = "some_catalog.some_schema.mv")
|def irrelevant_1():
| return spark.range(5)
|
- |@sdp.table(name = "some_catalog.some_schema.st")
+ |@dp.table(name = "some_catalog.some_schema.st")
|def irrelevant_2():
| return spark.readStream.format("rate").load()
|""".stripMargin).resolve()
@@ -339,24 +353,28 @@ class PythonPipelineSuite
TableIdentifier("st", Some("some_schema"), Some("some_catalog"))))
}
- test("view works") {
+ test("temporary views works") {
+ // A table is defined since pipeline with only temporary views is invalid.
val graph = buildGraph(s"""
- |@sdp.temporary_view
+ |@dp.table
+ |def mv_1():
+ | return spark.range(5)
+ |@dp.temporary_view
|def view_1():
| return spark.range(5)
|
- |@sdp.temporary_view(name= "view_2")
+ |@dp.temporary_view(name= "view_2")
|def irrelevant_1():
| return spark.read.table("view_1")
|
- |@sdp.temporary_view(name= "view_3")
+ |@dp.temporary_view(name= "view_3")
|def irrelevant_2():
| return spark.read.table("view_1")
|""".stripMargin).resolve()
// views are temporary views, so they're not fully qualified.
- assert(graph.tables.isEmpty)
assert(
- graph.flows.map(_.identifier.unquotedString).toSet == Set("view_1", "view_2", "view_3"))
+ Set("view_1", "view_2", "view_3").subsetOf(
+ graph.flows.map(_.identifier.unquotedString).toSet))
// dependencies are correctly resolved view_2 reading from view_1
assert(
graph.resolvedFlow(TableIdentifier("view_2")).inputs.contains(TableIdentifier("view_1")))
@@ -367,11 +385,11 @@ class PythonPipelineSuite
test("create named flow with multipart name will fail") {
val ex = intercept[RuntimeException] {
buildGraph(s"""
- |@sdp.table
+ |@dp.table
|def src():
| return spark.readStream.table("src0")
|
- |@sdp.append_flow(name ="some_schema.some_flow", target = "src")
+ |@dp.append_flow(name ="some_schema.some_flow", target = "src")
|def some_flow():
| return spark.readStream.format("rate").load()
|""".stripMargin)
@@ -381,11 +399,11 @@ class PythonPipelineSuite
test("create flow with multipart target and no explicit name succeeds") {
val graph = buildGraph("""
- |@sdp.table()
+ |@dp.table()
|def a():
| return spark.readStream.format("rate").load()
|
- |@sdp.append_flow(target = "default.a")
+ |@dp.append_flow(target = "default.a")
|def supplement():
| return spark.readStream.format("rate").load()
|""".stripMargin).resolve().validate()
@@ -400,11 +418,11 @@ class PythonPipelineSuite
test("create named flow with multipart target succeeds") {
val graph = buildGraph("""
- |@sdp.table()
+ |@dp.table()
|def a():
| return spark.readStream.format("rate").load()
|
- |@sdp.append_flow(target = "default.a", name = "something")
+ |@dp.append_flow(target = "default.a", name = "something")
|def supplement():
| return spark.readStream.format("rate").load()
|""".stripMargin)
@@ -416,6 +434,103 @@ class PythonPipelineSuite
.map(_.identifier) == Seq(graphIdentifier("a"), graphIdentifier("something")))
}
+ test("groupby and rollup works with internal datasets, referencing with (col, str)") {
+ val graph = buildGraph("""
+ from pyspark.sql.functions import col, sum, count
+
+ @dp.materialized_view
+ def src():
+ return spark.range(3)
+
+ @dp.materialized_view
+ def groupby_with_col_result():
+ return spark.read.table("src").groupBy(col("id")).agg(
+ sum("id").alias("sum_id"),
+ count("*").alias("cnt")
+ )
+
+ @dp.materialized_view
+ def groupby_with_str_result():
+ return spark.read.table("src").groupBy("id").agg(
+ sum("id").alias("sum_id"),
+ count("*").alias("cnt")
+ )
+
+ @dp.materialized_view
+ def rollup_with_col_result():
+ return spark.read.table("src").rollup(col("id")).agg(
+ sum("id").alias("sum_id"),
+ count("*").alias("cnt")
+ )
+
+ @dp.materialized_view
+ def rollup_with_str_result():
+ return spark.read.table("src").rollup("id").agg(
+ sum("id").alias("sum_id"),
+ count("*").alias("cnt")
+ )
+ """)
+
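+ // Run the pipeline to completion so the materialized views defined above can be queried.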
+ val updateContext = new PipelineUpdateContextImpl(graph, _ => ())
+ updateContext.pipelineExecution.runPipeline()
+ updateContext.pipelineExecution.awaitCompletion()
+
+ val groupbyDfs =
+ Seq(spark.table("groupby_with_col_result"), spark.table("groupby_with_str_result"))
+
+ val rollupDfs =
+ Seq(spark.table("rollup_with_col_result"), spark.table("rollup_with_str_result"))
+
+ // groupBy: each variant should have exactly one row per id [0,1,2]
+ groupbyDfs.foreach { df =>
+ assert(df.select("id").collect().map(_.getLong(0)).toSet == Set(0L, 1L, 2L))
+ }
+
+ // rollup: each variant should have groupBy rows + one total row
+ rollupDfs.foreach { df =>
+ assert(df.count() == 3 + 1) // 3 ids + 1 total
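+ // With ids 0, 1 and 2, the grand total row has sum_id = 0 + 1 + 2 = 3 and cnt = 3.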
+ val totalRow = df.filter("id IS NULL").collect().head
+ assert(totalRow.getLong(1) == 3L && totalRow.getLong(2) == 3L)
+ }
+ }
+
+ test("create pipeline without table will throw RUN_EMPTY_PIPELINE exception") {
+ checkError(
+ exception = intercept[AnalysisException] {
+ buildGraph(s"""
+ |spark.range(1)
+ |""".stripMargin)
+ },
+ condition = "RUN_EMPTY_PIPELINE",
+ parameters = Map.empty)
+ }
+
+ test("create pipeline with only temp view will throw RUN_EMPTY_PIPELINE exception") {
+ checkError(
+ exception = intercept[AnalysisException] {
+ buildGraph(s"""
+ |@dp.temporary_view
+ |def view_1():
+ | return spark.range(5)
+ |""".stripMargin)
+ },
+ condition = "RUN_EMPTY_PIPELINE",
+ parameters = Map.empty)
+ }
+
+ test("create pipeline with only flow will throw RUN_EMPTY_PIPELINE exception") {
+ checkError(
+ exception = intercept[AnalysisException] {
+ buildGraph(s"""
+ |@dp.append_flow(target = "a")
+ |def flow():
+ | return spark.range(5)
+ |""".stripMargin)
+ },
+ condition = "RUN_EMPTY_PIPELINE",
+ parameters = Map.empty)
+ }
+
/**
* Executes Python code in a separate process and returns the exit code.
*
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerSuite.scala
index 6bd31fba8ec26..ef5da0c014ee1 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerSuite.scala
@@ -17,10 +17,13 @@
package org.apache.spark.sql.connect.pipelines
+import java.util.UUID
+
import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.{DatasetType, Expression, PipelineCommand, Relation, UnresolvedTableValuedFunction}
import org.apache.spark.connect.proto.PipelineCommand.{DefineDataset, DefineFlow}
import org.apache.spark.internal.Logging
+import org.apache.spark.sql.connect.service.{SessionKey, SparkConnectService}
class SparkDeclarativePipelinesServerSuite
extends SparkDeclarativePipelinesServerTest
@@ -41,8 +44,7 @@ class SparkDeclarativePipelinesServerSuite
.newBuilder()
.build())).getPipelineCommandResult.getCreateDataflowGraphResult.getDataflowGraphId
val definition =
- DataflowGraphRegistry
- .getDataflowGraphOrThrow(graphId)
+ getDefaultSessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(graphId)
assert(definition.defaultDatabase == "test_db")
}
}
@@ -93,7 +95,7 @@ class SparkDeclarativePipelinesServerSuite
.setDataflowGraphId(graphId)
.setFlowName("mv")
.setTargetDatasetName("mv")
- .setPlan(
+ .setRelation(
Relation
.newBuilder()
.setUnresolvedTableValuedFunction(
@@ -115,8 +117,7 @@ class SparkDeclarativePipelinesServerSuite
|""".stripMargin)
val definition =
- DataflowGraphRegistry
- .getDataflowGraphOrThrow(graphId)
+ getDefaultSessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(graphId)
val graph = definition.toDataflowGraph.resolve()
@@ -161,8 +162,7 @@ class SparkDeclarativePipelinesServerSuite
}
val definition =
- DataflowGraphRegistry
- .getDataflowGraphOrThrow(graphId)
+ getDefaultSessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(graphId)
registerPipelineDatasets(pipeline)
val graph = definition.toDataflowGraph
@@ -206,7 +206,7 @@ class SparkDeclarativePipelinesServerSuite
sql = Some("SELECT * FROM STREAM tableA"))
createTable(
name = "tableC",
- datasetType = DatasetType.TABLE,
+ datasetType = DatasetType.MATERIALIZED_VIEW,
sql = Some("SELECT * FROM tableB"))
}
@@ -238,7 +238,7 @@ class SparkDeclarativePipelinesServerSuite
createView(name = "viewC", sql = "SELECT * FROM curr.tableB")
createTable(
name = "other.tableD",
- datasetType = proto.DatasetType.TABLE,
+ datasetType = proto.DatasetType.MATERIALIZED_VIEW,
sql = Some("SELECT * FROM viewC"))
}
@@ -251,4 +251,239 @@ class SparkDeclarativePipelinesServerSuite
assert(spark.table("spark_catalog.other.tableD").count() == 5)
}
}
+
+ test("dataflow graphs are session-specific") {
+ withRawBlockingStub { implicit stub =>
+ // Create a dataflow graph in the default session
+ val graphId1 = createDataflowGraph
+
+ // Register a dataset in the default session
+ sendPlan(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDefineDataset(
+ DefineDataset
+ .newBuilder()
+ .setDataflowGraphId(graphId1)
+ .setDatasetName("session1_table")
+ .setDatasetType(DatasetType.MATERIALIZED_VIEW))
+ .build()))
+
+ // Verify the graph exists in the default session
+ assert(getDefaultSessionHolder.dataflowGraphRegistry.getAllDataflowGraphs.size == 1)
+ }
+
+ // Create a second session with a different user and session ID
+ val newSessionId = UUID.randomUUID().toString
+ val newSessionUserId = "session2_user"
+
+ withRawBlockingStub { implicit stub =>
+ // Override the test context to use a different session
+ val newSessionExecuteRequest = buildExecutePlanRequest(
+ buildCreateDataflowGraphPlan(
+ proto.PipelineCommand.CreateDataflowGraph
+ .newBuilder()
+ .setDefaultCatalog("spark_catalog")
+ .setDefaultDatabase("default")
+ .build())).toBuilder
+ .setUserContext(proto.UserContext
+ .newBuilder()
+ .setUserId(newSessionUserId)
+ .build())
+ .setSessionId(newSessionId)
+ .build()
+
+ val response = stub.executePlan(newSessionExecuteRequest)
+ val graphId2 =
+ response.next().getPipelineCommandResult.getCreateDataflowGraphResult.getDataflowGraphId
+
+ // Register a different dataset in the second session
+ val session2DefineRequest = buildExecutePlanRequest(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDefineDataset(
+ DefineDataset
+ .newBuilder()
+ .setDataflowGraphId(graphId2)
+ .setDatasetName("session2_table")
+ .setDatasetType(DatasetType.MATERIALIZED_VIEW))
+ .build())).toBuilder
+ .setUserContext(proto.UserContext
+ .newBuilder()
+ .setUserId(newSessionUserId)
+ .build())
+ .setSessionId(newSessionId)
+ .build()
+
+ stub.executePlan(session2DefineRequest).next()
+
+ // Verify session isolation - each session should only see its own graphs
+ val newSessionHolder = SparkConnectService.sessionManager
+ .getIsolatedSession(SessionKey(newSessionUserId, newSessionId), None)
+
+ val defaultSessionGraphs =
+ getDefaultSessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
+ val newSessionGraphs = newSessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
+
+ assert(defaultSessionGraphs.size == 1)
+ assert(newSessionGraphs.size == 1)
+
+ assert(
+ defaultSessionGraphs.head.toDataflowGraph.tables
+ .exists(_.identifier.table == "session1_table"),
+ "Session 1 should have its own table")
+ assert(
+ newSessionGraphs.head.toDataflowGraph.tables
+ .exists(_.identifier.table == "session2_table"),
+ "Session 2 should have its own table")
+ }
+ }
+
+ test("dataflow graphs are cleaned up when session is closed") {
+ val testUserId = "test_user"
+ val testSessionId = UUID.randomUUID().toString
+
+ // Create a session and dataflow graph
+ withRawBlockingStub { implicit stub =>
+ val createGraphRequest = buildExecutePlanRequest(
+ buildCreateDataflowGraphPlan(
+ proto.PipelineCommand.CreateDataflowGraph
+ .newBuilder()
+ .setDefaultCatalog("spark_catalog")
+ .setDefaultDatabase("default")
+ .build())).toBuilder
+ .setUserContext(proto.UserContext
+ .newBuilder()
+ .setUserId(testUserId)
+ .build())
+ .setSessionId(testSessionId)
+ .build()
+
+ val response = stub.executePlan(createGraphRequest)
+ val graphId =
+ response.next().getPipelineCommandResult.getCreateDataflowGraphResult.getDataflowGraphId
+
+ // Register a dataset
+ val defineRequest = buildExecutePlanRequest(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDefineDataset(
+ DefineDataset
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setDatasetName("test_table")
+ .setDatasetType(DatasetType.MATERIALIZED_VIEW))
+ .build())).toBuilder
+ .setUserContext(proto.UserContext
+ .newBuilder()
+ .setUserId(testUserId)
+ .build())
+ .setSessionId(testSessionId)
+ .build()
+
+ stub.executePlan(defineRequest).next()
+
+ // Verify the graph exists
+ val sessionHolder = SparkConnectService.sessionManager
+ .getIsolatedSessionIfPresent(SessionKey(testUserId, testSessionId))
+ .get
+
+ val graphsBefore = sessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
+ assert(graphsBefore.size == 1)
+
+ // Close the session
+ SparkConnectService.sessionManager.closeSession(SessionKey(testUserId, testSessionId))
+
+ // Verify the session is no longer available
+ val sessionAfterClose = SparkConnectService.sessionManager
+ .getIsolatedSessionIfPresent(SessionKey(testUserId, testSessionId))
+
+ assert(sessionAfterClose.isEmpty, "Session should be cleaned up after close")
+ // Verify the graph is removed
+ val graphsAfter = sessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
+ assert(graphsAfter.isEmpty, "Graph should be removed after session close")
+ }
+ }
+
+ test("multiple dataflow graphs can exist in the same session") {
+ withRawBlockingStub { implicit stub =>
+ // Create two dataflow graphs in the same session
+ val graphId1 = createDataflowGraph
+ val graphId2 = createDataflowGraph
+
+ // Register datasets in both graphs
+ sendPlan(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDefineDataset(
+ DefineDataset
+ .newBuilder()
+ .setDataflowGraphId(graphId1)
+ .setDatasetName("graph1_table")
+ .setDatasetType(DatasetType.MATERIALIZED_VIEW))
+ .build()))
+
+ sendPlan(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDefineDataset(
+ DefineDataset
+ .newBuilder()
+ .setDataflowGraphId(graphId2)
+ .setDatasetName("graph2_table")
+ .setDatasetType(DatasetType.MATERIALIZED_VIEW))
+ .build()))
+
+ // Verify both graphs exist in the session
+ val sessionHolder = getDefaultSessionHolder
+ val graph1 = sessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(graphId1)
+ val graph2 = sessionHolder.dataflowGraphRegistry.getDataflowGraphOrThrow(graphId2)
+ // Check that both graphs have their datasets registered
+ assert(graph1.toDataflowGraph.tables.exists(_.identifier.table == "graph1_table"))
+ assert(graph2.toDataflowGraph.tables.exists(_.identifier.table == "graph2_table"))
+ }
+ }
+
+ test("dropping a dataflow graph removes it from session") {
+ withRawBlockingStub { implicit stub =>
+ val graphId = createDataflowGraph
+
+ // Register a dataset
+ sendPlan(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDefineDataset(
+ DefineDataset
+ .newBuilder()
+ .setDataflowGraphId(graphId)
+ .setDatasetName("test_table")
+ .setDatasetType(DatasetType.MATERIALIZED_VIEW))
+ .build()))
+
+ // Verify the graph exists
+ val sessionHolder = getDefaultSessionHolder
+ val graphsBefore = sessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
+ assert(graphsBefore.size == 1)
+
+ // Drop the graph
+ sendPlan(
+ buildPlanFromPipelineCommand(
+ PipelineCommand
+ .newBuilder()
+ .setDropDataflowGraph(PipelineCommand.DropDataflowGraph
+ .newBuilder()
+ .setDataflowGraphId(graphId))
+ .build()))
+
+ // Verify the graph is removed
+ val graphsAfter = sessionHolder.dataflowGraphRegistry.getAllDataflowGraphs
+ assert(graphsAfter.isEmpty, "Graph should be removed after drop")
+ }
+ }
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerTest.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerTest.scala
index ea4cc5f3aba55..a31883677f92a 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerTest.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/SparkDeclarativePipelinesServerTest.scala
@@ -17,10 +17,13 @@
package org.apache.spark.sql.connect.pipelines
+import scala.collection.mutable.ArrayBuffer
+
import org.apache.spark.connect.{proto => sc}
+import org.apache.spark.connect.proto.{PipelineCommand, PipelineEvent}
import org.apache.spark.sql.connect.{SparkConnectServerTest, SparkConnectTestUtils}
import org.apache.spark.sql.connect.planner.SparkConnectPlanner
-import org.apache.spark.sql.connect.service.{SessionKey, SparkConnectService}
+import org.apache.spark.sql.connect.service.{SessionHolder, SessionKey, SparkConnectService}
import org.apache.spark.sql.pipelines.utils.PipelineTest
class SparkDeclarativePipelinesServerTest extends SparkConnectServerTest {
@@ -28,12 +31,20 @@ class SparkDeclarativePipelinesServerTest extends SparkConnectServerTest {
override def afterEach(): Unit = {
SparkConnectService.sessionManager
.getIsolatedSessionIfPresent(SessionKey(defaultUserId, defaultSessionId))
- .foreach(_.removeAllPipelineExecutions())
- DataflowGraphRegistry.dropAllDataflowGraphs()
+ .foreach(s => {
+ s.removeAllPipelineExecutions()
+ s.dataflowGraphRegistry.dropAllDataflowGraphs()
+ })
PipelineTest.cleanupMetastore(spark)
super.afterEach()
}
+ // Helper method to get the default session holder.
+ protected def getDefaultSessionHolder: SessionHolder = {
+ SparkConnectService.sessionManager
+ .getIsolatedSession(SessionKey(defaultUserId, defaultSessionId), None)
+ }
+
def buildPlanFromPipelineCommand(command: sc.PipelineCommand): sc.Plan = {
sc.Plan
.newBuilder()
@@ -125,15 +136,27 @@ class SparkDeclarativePipelinesServerTest extends SparkConnectServerTest {
def createPlanner(): SparkConnectPlanner =
new SparkConnectPlanner(SparkConnectTestUtils.createDummySessionHolder(spark))
- def startPipelineAndWaitForCompletion(graphId: String): Unit = {
+ def startPipelineAndWaitForCompletion(graphId: String): ArrayBuffer[PipelineEvent] = {
+ val defaultStartRunCommand =
+ PipelineCommand.StartRun.newBuilder().setDataflowGraphId(graphId).build()
+ startPipelineAndWaitForCompletion(defaultStartRunCommand)
+ }
+
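+ // Starts a run for the given StartRun command and collects the PipelineEvents streamed back until the run completes.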
+ def startPipelineAndWaitForCompletion(
+ startRunCommand: PipelineCommand.StartRun): ArrayBuffer[PipelineEvent] = {
withClient { client =>
- val startRunRequest = buildStartRunPlan(
- sc.PipelineCommand.StartRun.newBuilder().setDataflowGraphId(graphId).build())
+ val capturedEvents = new ArrayBuffer[PipelineEvent]()
+ val startRunRequest = buildStartRunPlan(startRunCommand)
val responseIterator = client.execute(startRunRequest)
// The response iterator will be closed when the pipeline is completed.
while (responseIterator.hasNext) {
- responseIterator.next()
+ val response = responseIterator.next()
+ if (response.hasPipelineEventResult) {
+ capturedEvents.append(response.getPipelineEventResult.getEvent)
+ }
}
+ return capturedEvents
}
+ ArrayBuffer.empty[PipelineEvent]
}
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/TestPipelineDefinition.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/TestPipelineDefinition.scala
index 3efc71ba7d259..c31aec0b7a5e6 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/TestPipelineDefinition.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/pipelines/TestPipelineDefinition.scala
@@ -58,9 +58,8 @@ class TestPipelineDefinition(graphId: String) {
.setDataflowGraphId(graphId)
.setFlowName(name)
.setTargetDatasetName(name)
- .setPlan(q)
+ .setRelation(q)
.putAllSqlConf(sparkConf.asJava)
- .setOnce(false)
.build()
}
}
@@ -98,9 +97,8 @@ class TestPipelineDefinition(graphId: String) {
.setDataflowGraphId(graphId)
.setFlowName(name)
.setTargetDatasetName(name)
- .setPlan(query)
+ .setRelation(query)
.putAllSqlConf(sparkConf.asJava)
- .setOnce(false)
.build()
}
@@ -125,9 +123,8 @@ class TestPipelineDefinition(graphId: String) {
.setDataflowGraphId(graphId)
.setFlowName(name)
.setTargetDatasetName(destinationName)
- .setPlan(query)
+ .setRelation(query)
.putAllSqlConf(sparkConf.asJava)
- .setOnce(once)
.build()
}
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverterSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverterSuite.scala
index 79ef8decb310a..0af181e4be1a7 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverterSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/LiteralExpressionProtoConverterSuite.scala
@@ -19,15 +19,244 @@ package org.apache.spark.sql.connect.planner
import org.scalatest.funsuite.AnyFunSuite // scalastyle:ignore funsuite
+import org.apache.spark.connect.proto
import org.apache.spark.sql.connect.common.LiteralValueProtoConverter
+import org.apache.spark.sql.connect.common.LiteralValueProtoConverter.ToLiteralProtoOptions
+import org.apache.spark.sql.connect.planner.LiteralExpressionProtoConverter
+import org.apache.spark.sql.types._
class LiteralExpressionProtoConverterSuite extends AnyFunSuite { // scalastyle:ignore funsuite
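+ // Helpers to build literal protos without the deprecated data type fields.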
+ private def toLiteralProto(v: Any): proto.Expression.Literal = {
+ LiteralValueProtoConverter
+ .toLiteralProtoWithOptions(
+ v,
+ None,
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = false))
+ }
+
+ private def toLiteralProto(v: Any, t: DataType): proto.Expression.Literal = {
+ LiteralValueProtoConverter
+ .toLiteralProtoWithOptions(
+ v,
+ Some(t),
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = false))
+ }
+
test("basic proto value and catalyst value conversion") {
val values = Array(null, true, 1.toByte, 1.toShort, 1, 1L, 1.1d, 1.1f, "spark")
for (v <- values) {
- assertResult(v)(
- LiteralValueProtoConverter.toCatalystValue(LiteralValueProtoConverter.toLiteralProto(v)))
+ assertResult(v)(LiteralValueProtoConverter.toCatalystValue(toLiteralProto(v)))
+ }
+ }
+
+ Seq(
+ (
+ (1, "string", true),
+ StructType(
+ Seq(
+ StructField("a", IntegerType),
+ StructField("b", StringType),
+ StructField("c", BooleanType)))),
+ (
+ Array((1, "string", true), (2, "string", false), (3, "string", true)),
+ ArrayType(
+ StructType(
+ Seq(
+ StructField("a", IntegerType),
+ StructField("b", StringType),
+ StructField("c", BooleanType))))),
+ (
+ (1, (2, 3)),
+ StructType(
+ Seq(
+ StructField("a", IntegerType),
+ StructField(
+ "b",
+ StructType(
+ Seq(StructField("c", IntegerType), StructField("d", IntegerType)))))))).zipWithIndex
+ .foreach { case ((v, t), idx) =>
+ test(s"complex proto value and catalyst value conversion #$idx") {
+ assertResult(v)(
+ LiteralValueProtoConverter.toCatalystValue(
+ LiteralValueProtoConverter.toLiteralProtoWithOptions(
+ v,
+ Some(t),
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = false))))
+ }
+
+ test(s"complex proto value and catalyst value conversion #$idx - backward compatibility") {
+ assertResult(v)(
+ LiteralValueProtoConverter.toCatalystValue(
+ LiteralValueProtoConverter.toLiteralProtoWithOptions(
+ v,
+ Some(t),
+ ToLiteralProtoOptions(useDeprecatedDataTypeFields = true))))
+ }
}
+
+ test("backward compatibility for array literal proto") {
+ // Test the old way of defining arrays with elementType field and elements
+ val arrayProto = proto.Expression.Literal.Array
+ .newBuilder()
+ .setElementType(
+ proto.DataType
+ .newBuilder()
+ .setInteger(proto.DataType.Integer.newBuilder())
+ .build())
+ .addElements(toLiteralProto(1))
+ .addElements(toLiteralProto(2))
+ .addElements(toLiteralProto(3))
+ .build()
+
+ val literalProto = proto.Expression.Literal.newBuilder().setArray(arrayProto).build()
+ val literal = LiteralExpressionProtoConverter.toCatalystExpression(literalProto)
+ assert(literal.dataType.isInstanceOf[ArrayType])
+ assert(literal.dataType.asInstanceOf[ArrayType].elementType == IntegerType)
+ // The containsNull field is always set to true when using the old way of defining arrays.
+ assert(literal.dataType.asInstanceOf[ArrayType].containsNull)
+
+ val arrayData = literal.value.asInstanceOf[org.apache.spark.sql.catalyst.util.ArrayData]
+ assert(arrayData.numElements() == 3)
+ assert(arrayData.getInt(0) == 1)
+ assert(arrayData.getInt(1) == 2)
+ assert(arrayData.getInt(2) == 3)
+ }
+
+ test("backward compatibility for map literal proto") {
+ // Test the old way of defining maps with keyType and valueType fields
+ val mapProto = proto.Expression.Literal.Map
+ .newBuilder()
+ .setKeyType(
+ proto.DataType
+ .newBuilder()
+ .setString(proto.DataType.String.newBuilder())
+ .build())
+ .setValueType(
+ proto.DataType
+ .newBuilder()
+ .setInteger(proto.DataType.Integer.newBuilder())
+ .build())
+ .addKeys(toLiteralProto("a"))
+ .addKeys(toLiteralProto("b"))
+ .addValues(toLiteralProto(1))
+ .addValues(toLiteralProto(2))
+ .build()
+
+ val literalProto = proto.Expression.Literal.newBuilder().setMap(mapProto).build()
+ val literal = LiteralExpressionProtoConverter.toCatalystExpression(literalProto)
+ assert(literal.dataType.isInstanceOf[MapType])
+ assert(literal.dataType.asInstanceOf[MapType].keyType == StringType)
+ assert(literal.dataType.asInstanceOf[MapType].valueType == IntegerType)
+ // The valueContainsNull field is always set to true when using the old way of defining maps.
+ assert(literal.dataType.asInstanceOf[MapType].valueContainsNull)
+
+ val mapData = literal.value.asInstanceOf[org.apache.spark.sql.catalyst.util.MapData]
+ assert(mapData.numElements() == 2)
+ val keys = mapData.keyArray()
+ val values = mapData.valueArray()
+ assert(keys.getUTF8String(0).toString == "a")
+ assert(values.getInt(0) == 1)
+ assert(keys.getUTF8String(1).toString == "b")
+ assert(values.getInt(1) == 2)
+ }
+
+ test("backward compatibility for struct literal proto") {
+ // Test the old way of defining structs with structType field and elements
+ val structTypeProto = proto.DataType.Struct
+ .newBuilder()
+ .addFields(
+ proto.DataType.StructField
+ .newBuilder()
+ .setName("a")
+ .setDataType(proto.DataType
+ .newBuilder()
+ .setInteger(proto.DataType.Integer.newBuilder())
+ .build())
+ .setNullable(true)
+ .build())
+ .addFields(
+ proto.DataType.StructField
+ .newBuilder()
+ .setName("b")
+ .setDataType(proto.DataType
+ .newBuilder()
+ .setString(proto.DataType.String.newBuilder())
+ .build())
+ .setNullable(false)
+ .build())
+ .build()
+
+ val structProto = proto.Expression.Literal.Struct
+ .newBuilder()
+ .setStructType(proto.DataType.newBuilder().setStruct(structTypeProto).build())
+ .addElements(LiteralValueProtoConverter.toLiteralProto(1))
+ .addElements(LiteralValueProtoConverter.toLiteralProto("test"))
+ .build()
+
+ val result = LiteralValueProtoConverter.toCatalystStruct(structProto)
+ val resultType = LiteralValueProtoConverter.getProtoStructType(structProto)
+
+ // Verify the result is a tuple with correct values
+ assert(result.isInstanceOf[Product])
+ val product = result.asInstanceOf[Product]
+ assert(product.productArity == 2)
+ assert(product.productElement(0) == 1)
+ assert(product.productElement(1) == "test")
+
+ // Verify the returned struct type matches the original
+ assert(resultType.getFieldsCount == 2)
+ assert(resultType.getFields(0).getName == "a")
+ assert(resultType.getFields(0).getDataType.hasInteger)
+ assert(resultType.getFields(0).getNullable)
+ assert(resultType.getFields(1).getName == "b")
+ assert(resultType.getFields(1).getDataType.hasString)
+ assert(!resultType.getFields(1).getNullable)
+ }
+
+ test("data types of struct fields are not set for inferable types") {
+ val literalProto = toLiteralProto(
+ (1, 2.0, true, (1, 2)),
+ StructType(
+ Seq(
+ StructField("a", IntegerType),
+ StructField("b", DoubleType),
+ StructField("c", BooleanType),
+ StructField(
+ "d",
+ StructType(Seq(StructField("e", IntegerType), StructField("f", IntegerType)))))))
+ assert(!literalProto.getStruct.getDataTypeStruct.getFieldsList.get(0).hasDataType)
+ assert(!literalProto.getStruct.getDataTypeStruct.getFieldsList.get(1).hasDataType)
+ assert(!literalProto.getStruct.getDataTypeStruct.getFieldsList.get(2).hasDataType)
+ assert(!literalProto.getStruct.getDataTypeStruct.getFieldsList.get(3).hasDataType)
+ }
+
+ test("data types of struct fields are set for non-inferable types") {
+ val literalProto = toLiteralProto(
+ ("string", Decimal(1)),
+ StructType(Seq(StructField("a", StringType), StructField("b", DecimalType(10, 2)))))
+ assert(literalProto.getStruct.getDataTypeStruct.getFieldsList.get(0).hasDataType)
+ assert(literalProto.getStruct.getDataTypeStruct.getFieldsList.get(1).hasDataType)
+ }
+
+ test("nullable and metadata fields are set for struct literal proto") {
+ val literalProto = toLiteralProto(
+ ("string", Decimal(1)),
+ StructType(Seq(
+ StructField("a", StringType, nullable = true, Metadata.fromJson("""{"key": "value"}""")),
+ StructField("b", DecimalType(10, 2), nullable = false))))
+ val structFields = literalProto.getStruct.getDataTypeStruct.getFieldsList
+ assert(structFields.get(0).getNullable)
+ assert(structFields.get(0).hasMetadata)
+ assert(structFields.get(0).getMetadata == """{"key":"value"}""")
+ assert(!structFields.get(1).getNullable)
+ assert(!structFields.get(1).hasMetadata)
+
+ val structTypeProto = LiteralValueProtoConverter.getProtoStructType(literalProto.getStruct)
+ assert(structTypeProto.getFieldsList.get(0).getNullable)
+ assert(structTypeProto.getFieldsList.get(0).hasMetadata)
+ assert(structTypeProto.getFieldsList.get(0).getMetadata == """{"key":"value"}""")
+ assert(!structTypeProto.getFieldsList.get(1).getNullable)
+ assert(!structTypeProto.getFieldsList.get(1).hasMetadata)
}
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectPlannerSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectPlannerSuite.scala
index 126c4d7a3cfe5..16cdd7da82799 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectPlannerSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectPlannerSuite.scala
@@ -38,7 +38,7 @@ import org.apache.spark.sql.connect.common.InvalidPlanInput
import org.apache.spark.sql.connect.common.LiteralValueProtoConverter.toLiteralProto
import org.apache.spark.sql.execution.arrow.ArrowConverters
import org.apache.spark.sql.test.SharedSparkSession
-import org.apache.spark.sql.types.{IntegerType, StringType, StructField, StructType}
+import org.apache.spark.sql.types.{IntegerType, StringType, StructField, StructType, TimeType}
import org.apache.spark.unsafe.types.UTF8String
/**
@@ -961,4 +961,49 @@ class SparkConnectPlannerSuite extends SparkFunSuite with SparkConnectPlanTest {
assert(plan.aggregateExpressions.forall(aggregateExpression =>
!aggregateExpression.containsPattern(TreePattern.UNRESOLVED_ORDINAL)))
}
+
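+ // 86399999999999 nanoseconds corresponds to 23:59:59.999999999, the last nanosecond of a day.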
+ test("Time literal") {
+ val project = proto.Project.newBuilder
+ .addExpressions(
+ proto.Expression.newBuilder
+ .setLiteral(proto.Expression.Literal.newBuilder.setTime(
+ proto.Expression.Literal.newBuilder.getTimeBuilder
+ .setNano(86399999999999L)
+ .setPrecision(TimeType.MIN_PRECISION)))
+ .build())
+ .addExpressions(
+ proto.Expression.newBuilder
+ .setLiteral(
+ proto.Expression.Literal.newBuilder.setTime(
+ proto.Expression.Literal.newBuilder.getTimeBuilder
+ .setNano(86399999999999L)
+ .setPrecision(TimeType.MAX_PRECISION)))
+ .build())
+ .addExpressions(
+ proto.Expression.newBuilder
+ .setLiteral(
+ proto.Expression.Literal.newBuilder.setTime(
+ proto.Expression.Literal.newBuilder.getTimeBuilder
+ .setNano(86399999999999L)
+ .setPrecision(TimeType.DEFAULT_PRECISION)))
+ .build())
+ .addExpressions(proto.Expression.newBuilder
+ .setLiteral(proto.Expression.Literal.newBuilder.setTime(
+ proto.Expression.Literal.newBuilder.getTimeBuilder.setNano(86399999999999L)))
+ .build())
+ .build()
+
+ val logical = transform(proto.Relation.newBuilder.setProject(project).build())
+ val df = Dataset.ofRows(spark, logical)
+ assertResult(df.schema.fields(0).dataType)(TimeType(TimeType.MIN_PRECISION))
+ assertResult(df.schema.fields(1).dataType)(TimeType(TimeType.MAX_PRECISION))
+ assertResult(df.schema.fields(2).dataType)(TimeType(TimeType.DEFAULT_PRECISION))
+ assertResult(df.schema.fields(3).dataType)(TimeType(TimeType.DEFAULT_PRECISION))
+ assertResult(df.collect()(0).toString)(
+ InternalRow(
+ "23:59:59.999999999",
+ "23:59:59.999999999",
+ "23:59:59.999999999",
+ "23:59:59.999999999").toString)
+ }
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectProtoSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectProtoSuite.scala
index 5c43715d2dd13..7b734f93e595e 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectProtoSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectProtoSuite.scala
@@ -40,7 +40,7 @@ import org.apache.spark.sql.connect.dsl.MockRemoteSession
import org.apache.spark.sql.connect.dsl.commands._
import org.apache.spark.sql.connect.dsl.expressions._
import org.apache.spark.sql.connect.dsl.plans._
-import org.apache.spark.sql.connector.catalog.{Identifier, InMemoryTableCatalog, TableCatalog}
+import org.apache.spark.sql.connector.catalog.{Column => ColumnV2, Identifier, InMemoryTableCatalog, TableCatalog}
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.CatalogHelper
import org.apache.spark.sql.execution.arrow.ArrowConverters
import org.apache.spark.sql.functions._
@@ -822,7 +822,9 @@ class SparkConnectProtoSuite extends PlanTest with SparkConnectPlanTest {
.asTableCatalog
.loadTable(Identifier.of(Array(), "table_name"))
assert(table.name === "testcat.table_name")
- assert(table.schema === new StructType().add("id", LongType).add("data", StringType))
+ assert(
+ table.columns sameElements
+ Array(ColumnV2.create("id", LongType), ColumnV2.create("data", StringType)))
assert(table.partitioning.isEmpty)
assert(table.properties === (Map("provider" -> "foo") ++ defaultOwnership).asJava)
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectServiceSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectServiceSuite.scala
index 4fb57b736185a..c5567e0d218c3 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectServiceSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/planner/SparkConnectServiceSuite.scala
@@ -920,7 +920,11 @@ class SparkConnectServiceSuite
}
def onError(throwable: Throwable): Unit = {
assert(executeHolder.eventsManager.hasCanceled.isEmpty)
- assert(executeHolder.eventsManager.hasError.isDefined)
+ Eventually.eventually(EVENT_WAIT_TIMEOUT) {
+ assert(
+ executeHolder.eventsManager.hasError.isDefined,
+ s"Error has not been recorded in events manager within $EVENT_WAIT_TIMEOUT")
+ }
}
def onCompleted(producedRowCount: Option[Long] = None): Unit = {
assert(executeHolder.eventsManager.getProducedRowCount == producedRowCount)
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/AddArtifactsHandlerSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/AddArtifactsHandlerSuite.scala
index a158ca9fad8ce..6cc5daadfddd7 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/AddArtifactsHandlerSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/AddArtifactsHandlerSuite.scala
@@ -32,6 +32,7 @@ import io.grpc.StatusRuntimeException
import io.grpc.protobuf.StatusProto
import io.grpc.stub.StreamObserver
+import org.apache.spark.SparkRuntimeException
import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.{AddArtifactsRequest, AddArtifactsResponse}
import org.apache.spark.sql.connect.ResourceHelper
@@ -43,6 +44,7 @@ class AddArtifactsHandlerSuite extends SharedSparkSession with ResourceHelper {
private val CHUNK_SIZE: Int = 32 * 1024
private val sessionId = UUID.randomUUID.toString()
+ private val sessionKey = SessionKey("c1", sessionId)
class DummyStreamObserver(p: Promise[AddArtifactsResponse])
extends StreamObserver[AddArtifactsResponse] {
@@ -51,17 +53,31 @@ class AddArtifactsHandlerSuite extends SharedSparkSession with ResourceHelper {
override def onCompleted(): Unit = {}
}
- class TestAddArtifactsHandler(responseObserver: StreamObserver[AddArtifactsResponse])
+ class TestAddArtifactsHandler(
+ responseObserver: StreamObserver[AddArtifactsResponse],
+ throwIfArtifactExists: Boolean = false)
extends SparkConnectAddArtifactsHandler(responseObserver) {
// Stop the staged artifacts from being automatically deleted
override protected def cleanUpStagedArtifacts(): Unit = {}
private val finalArtifacts = mutable.Buffer.empty[String]
+ private val artifactChecksums: mutable.Map[String, Long] = mutable.Map.empty
// Record the artifacts that are sent out for final processing.
override protected def addStagedArtifactToArtifactManager(artifact: StagedArtifact): Unit = {
+ // Throw if the artifact already exists and has a different checksum.
+ // This mocks the behavior of ArtifactManager.addArtifact without comparing the entire file.
+ if (throwIfArtifactExists
+ && finalArtifacts.contains(artifact.name)
+ && artifact.getCrc != artifactChecksums(artifact.name)) {
+ throw new SparkRuntimeException(
+ "ARTIFACT_ALREADY_EXISTS",
+ Map("normalizedRemoteRelativePath" -> artifact.name))
+ }
+
finalArtifacts.append(artifact.name)
+ artifactChecksums += (artifact.name -> artifact.getCrc)
}
def getFinalArtifacts: Seq[String] = finalArtifacts.toSeq
@@ -418,4 +434,79 @@ class AddArtifactsHandlerSuite extends SharedSparkSession with ResourceHelper {
}
}
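+ // Builds a single-chunk AddArtifactsRequest for the given artifact, including its CRC, and feeds it to the handler.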
+ def addSingleChunkArtifact(
+ handler: SparkConnectAddArtifactsHandler,
+ sessionKey: SessionKey,
+ name: String,
+ artifactPath: Path): Unit = {
+ val dataChunks = getDataChunks(artifactPath)
+ assert(dataChunks.size == 1)
+ val bytes = dataChunks.head
+ val context = proto.UserContext
+ .newBuilder()
+ .setUserId(sessionKey.userId)
+ .build()
+ val fileNameNoExtension = artifactPath.getFileName.toString.split('.').head
+ val singleChunkArtifact = proto.AddArtifactsRequest.SingleChunkArtifact
+ .newBuilder()
+ .setName(name)
+ .setData(
+ proto.AddArtifactsRequest.ArtifactChunk
+ .newBuilder()
+ .setData(bytes)
+ .setCrc(getCrcValues(crcPath.resolve(fileNameNoExtension + ".txt")).head)
+ .build())
+ .build()
+
+ val singleChunkArtifactRequest = AddArtifactsRequest
+ .newBuilder()
+ .setSessionId(sessionKey.sessionId)
+ .setUserContext(context)
+ .setBatch(
+ proto.AddArtifactsRequest.Batch.newBuilder().addArtifacts(singleChunkArtifact).build())
+ .build()
+
+ handler.onNext(singleChunkArtifactRequest)
+ }
+
+ test("All artifacts are added, even if some fail") {
+ val promise = Promise[AddArtifactsResponse]()
+ val handler =
+ new TestAddArtifactsHandler(new DummyStreamObserver(promise), throwIfArtifactExists = true)
+ try {
+ val name1 = "jars/dummy1.jar"
+ val name2 = "jars/dummy2.jar"
+ val name3 = "jars/dummy3.jar"
+
+ val artifactPath1 = inputFilePath.resolve("smallClassFile.class")
+ val artifactPath2 = inputFilePath.resolve("smallJar.jar")
+
+ assume(artifactPath1.toFile.exists)
+ addSingleChunkArtifact(handler, sessionKey, name1, artifactPath1)
+ addSingleChunkArtifact(handler, sessionKey, name3, artifactPath1)
+
+ val e = intercept[StatusRuntimeException] {
+ addSingleChunkArtifact(handler, sessionKey, name1, artifactPath2)
+ addSingleChunkArtifact(handler, sessionKey, name2, artifactPath1)
+ addSingleChunkArtifact(handler, sessionKey, name3, artifactPath2)
+ handler.onCompleted()
+ }
+
+ // All three artifacts should still be added, despite the exception.
+ assert(handler.getFinalArtifacts.contains(name1))
+ assert(handler.getFinalArtifacts.contains(name2))
+ assert(handler.getFinalArtifacts.contains(name3))
+
+ assert(e.getStatus.getCode == Code.INTERNAL)
+ val statusProto = StatusProto.fromThrowable(e)
+ assert(statusProto.getDetailsCount == 1)
+ val details = statusProto.getDetails(0)
+ val info = details.unpack(classOf[ErrorInfo])
+
+ assert(e.getMessage.contains("ARTIFACT_ALREADY_EXISTS"))
+ assert(info.getMetadataMap().get("messageParameters").contains(name1))
+ } finally {
+ handler.forceCleanUp()
+ }
+ }
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/ExecuteEventsManagerSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/ExecuteEventsManagerSuite.scala
index 66dd3680d93a2..a17c76ae95286 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/ExecuteEventsManagerSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/ExecuteEventsManagerSuite.scala
@@ -24,7 +24,7 @@ import scala.util.matching.Regex
import org.mockito.Mockito._
import org.scalatestplus.mockito.MockitoSugar
-import org.apache.spark.{SparkConf, SparkContext, SparkFunSuite}
+import org.apache.spark.{SparkContext, SparkFunSuite}
import org.apache.spark.connect.proto
import org.apache.spark.connect.proto.{ExecutePlanRequest, Plan, UserContext}
import org.apache.spark.scheduler.LiveListenerBus
@@ -51,7 +51,6 @@ class ExecuteEventsManagerSuite
val DEFAULT_SESSION_ID = UUID.randomUUID.toString
val DEFAULT_QUERY_ID = UUID.randomUUID.toString
val DEFAULT_CLIENT_TYPE = "clientType"
- val jsonProtocol = new JsonProtocol(new SparkConf())
test("SPARK-43923: post started") {
val events = setupEvents(ExecuteStatus.Pending)
@@ -72,8 +71,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationStarted])
}
@@ -91,8 +90,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationAnalyzed])
}
@@ -118,8 +117,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationReadyForExecution])
}
@@ -134,8 +133,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationCanceled])
}
@@ -152,8 +151,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationFailed])
}
@@ -168,8 +167,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationFinished])
}
@@ -209,8 +208,8 @@ class ExecuteEventsManagerSuite
.post(expectedEvent)
assert(
- jsonProtocol
- .sparkEventFromJson(jsonProtocol.sparkEventToJsonString(expectedEvent))
+ JsonProtocol
+ .sparkEventFromJson(JsonProtocol.sparkEventToJsonString(expectedEvent))
.isInstanceOf[SparkListenerConnectOperationClosed])
}
diff --git a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/SparkConnectSessionHolderSuite.scala b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/SparkConnectSessionHolderSuite.scala
index 159b29ce6b8e7..a110b0164f199 100644
--- a/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/SparkConnectSessionHolderSuite.scala
+++ b/sql/connect/server/src/test/scala/org/apache/spark/sql/connect/service/SparkConnectSessionHolderSuite.scala
@@ -401,19 +401,23 @@ class SparkConnectSessionHolderSuite extends SharedSparkSession {
test("Test session plan cache - disabled") {
val sessionHolder = SparkConnectTestUtils.createDummySessionHolder(spark)
// Disable plan cache of the session
- sessionHolder.session.conf.set(Connect.CONNECT_SESSION_PLAN_CACHE_ENABLED.key, false)
- val planner = new SparkConnectPlanner(sessionHolder)
+ try {
+ sessionHolder.session.conf.set(Connect.CONNECT_SESSION_PLAN_CACHE_ENABLED.key, false)
+ val planner = new SparkConnectPlanner(sessionHolder)
- val query = buildRelation("select 1")
+ val query = buildRelation("select 1")
- // If cachePlan is false, the cache is still empty.
- // Although the cache is created as cache size is greater than zero, it won't be used.
- planner.transformRelation(query, cachePlan = false)
- assertPlanCache(sessionHolder, Some(Set()))
+ // If cachePlan is false, the cache is still empty.
+ // Although the cache is created as cache size is greater than zero, it won't be used.
+ planner.transformRelation(query, cachePlan = false)
+ assertPlanCache(sessionHolder, Some(Set()))
- // Even if we specify "cachePlan = true", the cache is still empty.
- planner.transformRelation(query, cachePlan = true)
- assertPlanCache(sessionHolder, Some(Set()))
+ // Even if we specify "cachePlan = true", the cache is still empty.
+ planner.transformRelation(query, cachePlan = true)
+ assertPlanCache(sessionHolder, Some(Set()))
+ } finally {
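+ // Re-enable the plan cache so other tests in this suite are not affected.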
+ sessionHolder.session.conf.set(Connect.CONNECT_SESSION_PLAN_CACHE_ENABLED, true)
+ }
}
test("Test duplicate operation IDs") {
@@ -440,4 +444,40 @@ class SparkConnectSessionHolderSuite extends SharedSparkSession {
sessionHolder.getPipelineExecution(graphId).isEmpty,
"pipeline execution was not removed")
}
+
+ gridTest("Actively cache data source reads")(Seq(true, false)) { enabled =>
+ val sessionHolder = SparkConnectTestUtils.createDummySessionHolder(spark)
+ val planner = new SparkConnectPlanner(sessionHolder)
+
+ val dataSourceRead = proto.Relation
+ .newBuilder()
+ .setRead(
+ proto.Read
+ .newBuilder()
+ .setDataSource(proto.Read.DataSource
+ .newBuilder()
+ .setSchema("col int")))
+ .setCommon(proto.RelationCommon.newBuilder().setPlanId(Random.nextLong()).build())
+ .build()
+ val dataSourceReadJoin = proto.Relation
+ .newBuilder()
+ .setJoin(
+ proto.Join
+ .newBuilder()
+ .setLeft(dataSourceRead)
+ .setRight(dataSourceRead)
+ .setJoinType(proto.Join.JoinType.JOIN_TYPE_CROSS))
+ .setCommon(proto.RelationCommon.newBuilder().setPlanId(Random.nextLong()).build())
+ .build()
+
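+ // When the flag is enabled, each data source read subtree is expected to be cached in addition to the top-level join.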
+ sessionHolder.session.conf
+ .set(Connect.CONNECT_ALWAYS_CACHE_DATA_SOURCE_READS_ENABLED, enabled)
+ planner.transformRelation(dataSourceReadJoin, cachePlan = true)
+ val expected = if (enabled) {
+ Set(dataSourceReadJoin, dataSourceRead)
+ } else {
+ Set(dataSourceReadJoin)
+ }
+ assertPlanCache(sessionHolder, Some(expected))
+ }
}
diff --git a/sql/core/benchmarks/AggregateBenchmark-jdk21-results.txt b/sql/core/benchmarks/AggregateBenchmark-jdk21-results.txt
index 186593aff6bbc..86de9e21ade3f 100644
--- a/sql/core/benchmarks/AggregateBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/AggregateBenchmark-jdk21-results.txt
@@ -2,147 +2,147 @@
aggregate without grouping
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
agg w/o group: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-agg w/o group wholestage off 35437 35937 707 59.2 16.9 1.0X
-agg w/o group wholestage on 2857 2862 6 734.0 1.4 12.4X
+agg w/o group wholestage off 35386 35792 574 59.3 16.9 1.0X
+agg w/o group wholestage on 2850 2855 4 735.8 1.4 12.4X
================================================================================================
stat functions
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
stddev: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-stddev wholestage off 4410 4433 34 23.8 42.1 1.0X
-stddev wholestage on 982 987 4 106.8 9.4 4.5X
+stddev wholestage off 4380 4400 27 23.9 41.8 1.0X
+stddev wholestage on 982 989 7 106.8 9.4 4.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
kurtosis: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-kurtosis wholestage off 22289 22520 326 4.7 212.6 1.0X
-kurtosis wholestage on 988 996 6 106.2 9.4 22.6X
+kurtosis wholestage off 21731 21746 20 4.8 207.2 1.0X
+kurtosis wholestage on 990 998 6 105.9 9.4 21.9X
================================================================================================
aggregate with linear keys
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w keys: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 6846 6857 16 12.3 81.6 1.0X
-codegen = T, hashmap = F 4326 4415 102 19.4 51.6 1.6X
-codegen = T, row-based hashmap = T 1180 1194 12 71.1 14.1 5.8X
-codegen = T, vectorized hashmap = T 804 843 39 104.3 9.6 8.5X
+codegen = F 6421 6468 66 13.1 76.5 1.0X
+codegen = T, hashmap = F 4050 4075 23 20.7 48.3 1.6X
+codegen = T, row-based hashmap = T 1229 1239 10 68.2 14.7 5.2X
+codegen = T, vectorized hashmap = T 812 824 12 103.3 9.7 7.9X
================================================================================================
aggregate with randomized keys
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w keys: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 7511 7796 403 11.2 89.5 1.0X
-codegen = T, hashmap = F 4800 4868 67 17.5 57.2 1.6X
-codegen = T, row-based hashmap = T 1661 1677 11 50.5 19.8 4.5X
-codegen = T, vectorized hashmap = T 1077 1159 121 77.9 12.8 7.0X
+codegen = F 7268 7292 33 11.5 86.6 1.0X
+codegen = T, hashmap = F 4630 4645 18 18.1 55.2 1.6X
+codegen = T, row-based hashmap = T 1641 1645 5 51.1 19.6 4.4X
+codegen = T, vectorized hashmap = T 1066 1115 73 78.7 12.7 6.8X
================================================================================================
aggregate with string key
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w string key: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 2438 2457 26 8.6 116.3 1.0X
-codegen = T, hashmap = F 1762 1770 7 11.9 84.0 1.4X
-codegen = T, row-based hashmap = T 1028 1044 11 20.4 49.0 2.4X
-codegen = T, vectorized hashmap = T 803 817 18 26.1 38.3 3.0X
+codegen = F 2524 2549 35 8.3 120.3 1.0X
+codegen = T, hashmap = F 1515 1540 41 13.8 72.2 1.7X
+codegen = T, row-based hashmap = T 1059 1068 6 19.8 50.5 2.4X
+codegen = T, vectorized hashmap = T 823 825 3 25.5 39.2 3.1X
================================================================================================
aggregate with decimal key
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w decimal key: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 2272 2276 6 9.2 108.3 1.0X
-codegen = T, hashmap = F 1343 1356 18 15.6 64.1 1.7X
-codegen = T, row-based hashmap = T 456 481 19 46.0 21.7 5.0X
-codegen = T, vectorized hashmap = T 333 336 4 63.0 15.9 6.8X
+codegen = F 2169 2174 6 9.7 103.4 1.0X
+codegen = T, hashmap = F 1349 1363 20 15.5 64.3 1.6X
+codegen = T, row-based hashmap = T 470 483 9 44.6 22.4 4.6X
+codegen = T, vectorized hashmap = T 313 317 2 67.0 14.9 6.9X
================================================================================================
aggregate with multiple key types
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w multiple keys: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 4329 4360 43 4.8 206.4 1.0X
-codegen = T, hashmap = F 2337 2347 14 9.0 111.5 1.9X
-codegen = T, row-based hashmap = T 1749 1752 4 12.0 83.4 2.5X
-codegen = T, vectorized hashmap = T 1628 1632 6 12.9 77.6 2.7X
+codegen = F 4283 4287 7 4.9 204.2 1.0X
+codegen = T, hashmap = F 2291 2301 13 9.2 109.3 1.9X
+codegen = T, row-based hashmap = T 1750 1756 7 12.0 83.5 2.4X
+codegen = T, vectorized hashmap = T 1584 1595 15 13.2 75.6 2.7X
================================================================================================
max function bytecode size of wholestagecodegen
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
max function bytecode size: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 359 370 9 1.8 548.0 1.0X
-codegen = T, hugeMethodLimit = 10000 142 160 16 4.6 216.6 2.5X
-codegen = T, hugeMethodLimit = 1500 136 146 11 4.8 207.3 2.6X
+codegen = F 365 391 24 1.8 557.4 1.0X
+codegen = T, hugeMethodLimit = 10000 141 155 13 4.6 215.6 2.6X
+codegen = T, hugeMethodLimit = 1500 134 146 20 4.9 205.0 2.7X
================================================================================================
cube
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cube: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cube wholestage off 2070 2141 100 2.5 394.8 1.0X
-cube wholestage on 1094 1113 12 4.8 208.6 1.9X
+cube wholestage off 2067 2088 31 2.5 394.2 1.0X
+cube wholestage on 1072 1084 9 4.9 204.4 1.9X
================================================================================================
hash and BytesToBytesMap
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
BytesToBytesMap: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UnsafeRowhash 146 147 2 143.2 7.0 1.0X
-murmur3 hash 54 54 0 390.9 2.6 2.7X
-fast hash 24 24 0 882.5 1.1 6.2X
-arrayEqual 137 137 0 153.2 6.5 1.1X
-Java HashMap (Long) 60 70 7 346.9 2.9 2.4X
-Java HashMap (two ints) 81 84 2 259.2 3.9 1.8X
-Java HashMap (UnsafeRow) 531 533 1 39.5 25.3 0.3X
-LongToUnsafeRowMap (opt=false) 351 352 1 59.7 16.7 0.4X
-LongToUnsafeRowMap (opt=true) 74 76 1 283.3 3.5 2.0X
-BytesToBytesMap (off Heap) 413 417 5 50.8 19.7 0.4X
-BytesToBytesMap (on Heap) 428 433 5 49.0 20.4 0.3X
-Aggregate HashMap 30 31 2 689.0 1.5 4.8X
+UnsafeRowhash 146 147 1 143.2 7.0 1.0X
+murmur3 hash 54 54 0 390.8 2.6 2.7X
+fast hash 24 24 0 882.6 1.1 6.2X
+arrayEqual 137 137 0 153.1 6.5 1.1X
+Java HashMap (Long) 62 65 3 335.8 3.0 2.3X
+Java HashMap (two ints) 86 90 4 242.5 4.1 1.7X
+Java HashMap (UnsafeRow) 509 511 4 41.2 24.3 0.3X
+LongToUnsafeRowMap (opt=false) 345 346 1 60.8 16.4 0.4X
+LongToUnsafeRowMap (opt=true) 85 86 1 246.3 4.1 1.7X
+BytesToBytesMap (off Heap) 437 439 1 48.0 20.8 0.3X
+BytesToBytesMap (on Heap) 437 438 1 48.0 20.8 0.3X
+Aggregate HashMap 30 31 1 690.8 1.4 4.8X
diff --git a/sql/core/benchmarks/AggregateBenchmark-results.txt b/sql/core/benchmarks/AggregateBenchmark-results.txt
index 68c605d5c4a16..27b6d7d37c505 100644
--- a/sql/core/benchmarks/AggregateBenchmark-results.txt
+++ b/sql/core/benchmarks/AggregateBenchmark-results.txt
@@ -2,147 +2,147 @@
aggregate without grouping
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
agg w/o group: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-agg w/o group wholestage off 38366 39019 923 54.7 18.3 1.0X
-agg w/o group wholestage on 3369 3383 9 622.5 1.6 11.4X
+agg w/o group wholestage off 38902 39364 653 53.9 18.5 1.0X
+agg w/o group wholestage on 3377 3381 4 621.0 1.6 11.5X
================================================================================================
stat functions
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
stddev: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-stddev wholestage off 4539 4551 17 23.1 43.3 1.0X
-stddev wholestage on 981 986 4 106.8 9.4 4.6X
+stddev wholestage off 4528 4536 12 23.2 43.2 1.0X
+stddev wholestage on 979 992 9 107.2 9.3 4.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
kurtosis: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-kurtosis wholestage off 22063 22102 56 4.8 210.4 1.0X
-kurtosis wholestage on 985 994 7 106.4 9.4 22.4X
+kurtosis wholestage off 23508 23553 64 4.5 224.2 1.0X
+kurtosis wholestage on 995 1000 5 105.4 9.5 23.6X
================================================================================================
aggregate with linear keys
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w keys: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 6868 6923 78 12.2 81.9 1.0X
-codegen = T, hashmap = F 4329 4358 35 19.4 51.6 1.6X
-codegen = T, row-based hashmap = T 1203 1222 19 69.7 14.3 5.7X
-codegen = T, vectorized hashmap = T 828 847 34 101.3 9.9 8.3X
+codegen = F 7037 7162 177 11.9 83.9 1.0X
+codegen = T, hashmap = F 4256 4318 57 19.7 50.7 1.7X
+codegen = T, row-based hashmap = T 1236 1256 20 67.9 14.7 5.7X
+codegen = T, vectorized hashmap = T 817 840 19 102.7 9.7 8.6X
================================================================================================
aggregate with randomized keys
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w keys: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 7623 7658 49 11.0 90.9 1.0X
-codegen = T, hashmap = F 4942 4971 28 17.0 58.9 1.5X
-codegen = T, row-based hashmap = T 1706 1729 17 49.2 20.3 4.5X
-codegen = T, vectorized hashmap = T 1042 1079 31 80.5 12.4 7.3X
+codegen = F 7713 7764 73 10.9 91.9 1.0X
+codegen = T, hashmap = F 4964 4975 18 16.9 59.2 1.6X
+codegen = T, row-based hashmap = T 1689 1711 20 49.7 20.1 4.6X
+codegen = T, vectorized hashmap = T 1044 1086 34 80.3 12.4 7.4X
================================================================================================
aggregate with string key
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w string key: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 2493 2520 39 8.4 118.9 1.0X
-codegen = T, hashmap = F 1527 1538 11 13.7 72.8 1.6X
-codegen = T, row-based hashmap = T 1015 1025 12 20.7 48.4 2.5X
-codegen = T, vectorized hashmap = T 821 831 11 25.5 39.2 3.0X
+codegen = F 2526 2539 18 8.3 120.5 1.0X
+codegen = T, hashmap = F 1567 1575 11 13.4 74.7 1.6X
+codegen = T, row-based hashmap = T 1024 1028 3 20.5 48.8 2.5X
+codegen = T, vectorized hashmap = T 825 829 5 25.4 39.3 3.1X
================================================================================================
aggregate with decimal key
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w decimal key: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 2122 2170 68 9.9 101.2 1.0X
-codegen = T, hashmap = F 1377 1393 22 15.2 65.7 1.5X
-codegen = T, row-based hashmap = T 437 442 4 48.0 20.9 4.9X
-codegen = T, vectorized hashmap = T 310 317 3 67.6 14.8 6.8X
+codegen = F 2110 2114 6 9.9 100.6 1.0X
+codegen = T, hashmap = F 1449 1450 2 14.5 69.1 1.5X
+codegen = T, row-based hashmap = T 448 458 13 46.8 21.4 4.7X
+codegen = T, vectorized hashmap = T 311 319 5 67.5 14.8 6.8X
================================================================================================
aggregate with multiple key types
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Aggregate w multiple keys: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 4196 4197 2 5.0 200.1 1.0X
-codegen = T, hashmap = F 2482 2493 14 8.4 118.4 1.7X
-codegen = T, row-based hashmap = T 1727 1740 18 12.1 82.4 2.4X
-codegen = T, vectorized hashmap = T 1648 1671 32 12.7 78.6 2.5X
+codegen = F 4264 4286 31 4.9 203.3 1.0X
+codegen = T, hashmap = F 2383 2406 32 8.8 113.6 1.8X
+codegen = T, row-based hashmap = T 1873 1876 4 11.2 89.3 2.3X
+codegen = T, vectorized hashmap = T 1674 1681 10 12.5 79.8 2.5X
================================================================================================
max function bytecode size of wholestagecodegen
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
max function bytecode size: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-codegen = F 359 388 25 1.8 548.0 1.0X
-codegen = T, hugeMethodLimit = 10000 147 166 16 4.5 223.6 2.5X
-codegen = T, hugeMethodLimit = 1500 135 146 13 4.8 206.5 2.7X
+codegen = F 379 411 21 1.7 577.6 1.0X
+codegen = T, hugeMethodLimit = 10000 137 160 20 4.8 209.4 2.8X
+codegen = T, hugeMethodLimit = 1500 135 156 15 4.9 205.7 2.8X
================================================================================================
cube
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cube: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cube wholestage off 2183 2214 44 2.4 416.4 1.0X
-cube wholestage on 1139 1148 7 4.6 217.3 1.9X
+cube wholestage off 2099 2117 27 2.5 400.3 1.0X
+cube wholestage on 1157 1164 5 4.5 220.7 1.8X
================================================================================================
hash and BytesToBytesMap
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
BytesToBytesMap: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UnsafeRowhash 204 205 1 102.9 9.7 1.0X
-murmur3 hash 69 70 1 304.0 3.3 3.0X
-fast hash 72 73 7 292.8 3.4 2.8X
-arrayEqual 144 144 0 145.8 6.9 1.4X
-Java HashMap (Long) 65 69 3 320.7 3.1 3.1X
-Java HashMap (two ints) 85 88 1 247.9 4.0 2.4X
-Java HashMap (UnsafeRow) 549 550 1 38.2 26.2 0.4X
-LongToUnsafeRowMap (opt=false) 342 344 1 61.3 16.3 0.6X
-LongToUnsafeRowMap (opt=true) 73 74 1 287.4 3.5 2.8X
-BytesToBytesMap (off Heap) 607 609 2 34.6 28.9 0.3X
-BytesToBytesMap (on Heap) 609 623 17 34.4 29.0 0.3X
-Aggregate HashMap 31 31 0 686.4 1.5 6.7X
+UnsafeRowhash 204 204 0 102.9 9.7 1.0X
+murmur3 hash 70 70 0 301.0 3.3 2.9X
+fast hash 72 72 1 293.2 3.4 2.8X
+arrayEqual 144 144 0 145.7 6.9 1.4X
+Java HashMap (Long) 65 68 3 321.3 3.1 3.1X
+Java HashMap (two ints) 91 93 2 229.2 4.4 2.2X
+Java HashMap (UnsafeRow) 541 544 3 38.7 25.8 0.4X
+LongToUnsafeRowMap (opt=false) 345 346 1 60.9 16.4 0.6X
+LongToUnsafeRowMap (opt=true) 81 82 1 259.0 3.9 2.5X
+BytesToBytesMap (off Heap) 540 544 3 38.8 25.8 0.4X
+BytesToBytesMap (on Heap) 544 546 2 38.5 25.9 0.4X
+Aggregate HashMap 31 31 2 686.0 1.5 6.7X
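The tables in these result files are auto-generated, so the figures themselves should not be hand-edited; only Best Time(ms) is measured directly, and the Rate(M/s), Per Row(ns), and Relative columns are derived from it. As a minimal sketch (not part of this diff), assuming the ~2.1 billion row count (`500L << 22`) used by the "agg w/o group" case above, the derived columns can be reproduced like this:

```scala
// Minimal sketch (not from the Spark repo): reproduces the derived columns of the
// AggregateBenchmark tables above from Best Time(ms) alone. The row count is an
// assumption for illustration; each benchmark case defines its own N.
object BenchmarkColumnsSketch {
  def main(args: Array[String]): Unit = {
    val rows = 500L << 22                 // assumed N for "agg w/o group" (~2.1e9 rows)
    val wholestageOffMs = 38902.0         // baseline row, Best Time(ms)
    val wholestageOnMs  = 3377.0          // comparison row, Best Time(ms)

    def rateMps(ms: Double)  = rows / (ms / 1000.0) / 1e6   // Rate(M/s)
    def perRowNs(ms: Double) = ms * 1e6 / rows               // Per Row(ns)
    def relative(ms: Double) = wholestageOffMs / ms          // Relative (baseline = 1.0X)

    Seq("off" -> wholestageOffMs, "on" -> wholestageOnMs).foreach { case (label, ms) =>
      println(f"wholestage $label: ${rateMps(ms)}%.1f M/s, ${perRowNs(ms)}%.1f ns/row, ${relative(ms)}%.1fX")
    }
  }
}
```

The printed values match the 53.9 M/s / 18.5 ns / 1.0X and 621.0 M/s / 1.6 ns / 11.5X figures in the "aggregate without grouping" table above, which is why only the timing columns shift between JDK updates while the derived columns move in lockstep.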
diff --git a/sql/core/benchmarks/AnsiIntervalSortBenchmark-jdk21-results.txt b/sql/core/benchmarks/AnsiIntervalSortBenchmark-jdk21-results.txt
index b8fafc2f6104b..8ab7df150dc27 100644
--- a/sql/core/benchmarks/AnsiIntervalSortBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/AnsiIntervalSortBenchmark-jdk21-results.txt
@@ -1,28 +1,28 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
year month interval one column: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-year month interval one column enable radix 23323 23592 290 4.3 233.2 1.0X
-year month interval one column disable radix 33714 34091 548 3.0 337.1 0.7X
+year month interval one column enable radix 23086 23193 180 4.3 230.9 1.0X
+year month interval one column disable radix 33420 33638 280 3.0 334.2 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
year month interval two columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-year month interval two columns enable radix 35096 35612 485 2.8 351.0 1.0X
-year month interval two columns disable radix 35011 35229 196 2.9 350.1 1.0X
+year month interval two columns enable radix 34321 34376 49 2.9 343.2 1.0X
+year month interval two columns disable radix 34147 34406 226 2.9 341.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
day time interval one columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-day time interval one columns enable radix 22557 22651 141 4.4 225.6 1.0X
-day time interval one columns disable radix 45748 47238 1535 2.2 457.5 0.5X
+day time interval one columns enable radix 22025 22097 95 4.5 220.2 1.0X
+day time interval one columns disable radix 33367 33681 273 3.0 333.7 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
day time interval two columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-day time interval two columns enable radix 34733 36376 2685 2.9 347.3 1.0X
-day time interval two columns disable radix 34733 34798 57 2.9 347.3 1.0X
+day time interval two columns enable radix 34400 34546 199 2.9 344.0 1.0X
+day time interval two columns disable radix 34308 34467 148 2.9 343.1 1.0X
diff --git a/sql/core/benchmarks/AnsiIntervalSortBenchmark-results.txt b/sql/core/benchmarks/AnsiIntervalSortBenchmark-results.txt
index 2f43585165677..ab4243d9d9daa 100644
--- a/sql/core/benchmarks/AnsiIntervalSortBenchmark-results.txt
+++ b/sql/core/benchmarks/AnsiIntervalSortBenchmark-results.txt
@@ -1,28 +1,28 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
year month interval one column: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-year month interval one column enable radix 22341 22440 168 4.5 223.4 1.0X
-year month interval one column disable radix 32157 32216 51 3.1 321.6 0.7X
+year month interval one column enable radix 22721 22833 190 4.4 227.2 1.0X
+year month interval one column disable radix 32701 33148 769 3.1 327.0 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
year month interval two columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-year month interval two columns enable radix 33156 33365 284 3.0 331.6 1.0X
-year month interval two columns disable radix 33156 33661 697 3.0 331.6 1.0X
+year month interval two columns enable radix 33482 33621 208 3.0 334.8 1.0X
+year month interval two columns disable radix 34206 35140 824 2.9 342.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
day time interval one columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-day time interval one columns enable radix 21445 21467 21 4.7 214.5 1.0X
-day time interval one columns disable radix 33962 34125 193 2.9 339.6 0.6X
+day time interval one columns enable radix 21312 21459 239 4.7 213.1 1.0X
+day time interval one columns disable radix 32898 33575 820 3.0 329.0 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
day time interval two columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-day time interval two columns enable radix 33598 34314 627 3.0 336.0 1.0X
-day time interval two columns disable radix 34614 34755 192 2.9 346.1 1.0X
+day time interval two columns enable radix 35367 35398 27 2.8 353.7 1.0X
+day time interval two columns disable radix 33655 34642 856 3.0 336.5 1.1X
diff --git a/sql/core/benchmarks/Base64Benchmark-jdk21-results.txt b/sql/core/benchmarks/Base64Benchmark-jdk21-results.txt
index 1ffdb71362577..402818e8677f3 100644
--- a/sql/core/benchmarks/Base64Benchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/Base64Benchmark-jdk21-results.txt
@@ -1,56 +1,56 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 2064 2074 13 9.7 103.2 1.0X
-apache 11112 11179 70 1.8 555.6 0.2X
+java 1702 1734 29 11.8 85.1 1.0X
+apache 12539 12638 149 1.6 626.9 0.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 3: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 2450 2454 4 8.2 122.5 1.0X
-apache 12408 12449 36 1.6 620.4 0.2X
+java 2296 2307 12 8.7 114.8 1.0X
+apache 13071 13126 95 1.5 653.5 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 3023 3025 2 6.6 151.1 1.0X
-apache 13242 13399 215 1.5 662.1 0.2X
+java 2547 2561 12 7.9 127.3 1.0X
+apache 13833 13954 190 1.4 691.7 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 7: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 3104 3107 3 6.4 155.2 1.0X
-apache 14314 14395 116 1.4 715.7 0.2X
+java 2364 2393 29 8.5 118.2 1.0X
+apache 14684 14846 151 1.4 734.2 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 3051 3110 69 6.6 152.5 1.0X
-apache 12294 12367 68 1.6 614.7 0.2X
+java 3451 3463 10 5.8 172.6 1.0X
+apache 13152 13264 99 1.5 657.6 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 3: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 4231 4235 6 4.7 211.5 1.0X
-apache 14025 14169 134 1.4 701.2 0.3X
+java 3957 3985 27 5.1 197.8 1.0X
+apache 15380 15852 454 1.3 769.0 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 5199 5209 14 3.8 260.0 1.0X
-apache 15985 16010 26 1.3 799.3 0.3X
+java 5316 5319 3 3.8 265.8 1.0X
+apache 16800 17066 241 1.2 840.0 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 7: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 5650 5664 18 3.5 282.5 1.0X
-apache 17240 17296 49 1.2 862.0 0.3X
+java 5803 5816 19 3.4 290.2 1.0X
+apache 17991 18178 257 1.1 899.5 0.3X
diff --git a/sql/core/benchmarks/Base64Benchmark-results.txt b/sql/core/benchmarks/Base64Benchmark-results.txt
index ee761ac20b45f..168622f3ee6d5 100644
--- a/sql/core/benchmarks/Base64Benchmark-results.txt
+++ b/sql/core/benchmarks/Base64Benchmark-results.txt
@@ -1,56 +1,56 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 2137 2171 52 9.4 106.9 1.0X
-apache 11307 11383 122 1.8 565.4 0.2X
+java 1803 1819 20 11.1 90.2 1.0X
+apache 10576 10612 33 1.9 528.8 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 3: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 2607 2632 23 7.7 130.3 1.0X
-apache 12419 12504 77 1.6 620.9 0.2X
+java 2202 2206 4 9.1 110.1 1.0X
+apache 11399 11473 71 1.8 570.0 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 3217 3221 6 6.2 160.8 1.0X
-apache 13718 13802 123 1.5 685.9 0.2X
+java 2389 2413 22 8.4 119.5 1.0X
+apache 12749 12760 10 1.6 637.4 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode for 7: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 3680 3809 202 5.4 184.0 1.0X
-apache 14864 14911 41 1.3 743.2 0.2X
+java 2678 2692 19 7.5 133.9 1.0X
+apache 13702 13728 23 1.5 685.1 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 3284 3421 193 6.1 164.2 1.0X
-apache 12601 12635 45 1.6 630.0 0.3X
+java 2485 2607 135 8.0 124.2 1.0X
+apache 11603 11610 8 1.7 580.2 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 3: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 4651 4656 7 4.3 232.6 1.0X
-apache 14540 14547 8 1.4 727.0 0.3X
+java 3652 3680 25 5.5 182.6 1.0X
+apache 13428 13497 66 1.5 671.4 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 5689 5703 12 3.5 284.5 1.0X
-apache 16703 16719 16 1.2 835.1 0.3X
+java 4284 4359 66 4.7 214.2 1.0X
+apache 15058 15105 79 1.3 752.9 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
decode for 7: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-java 6467 6473 5 3.1 323.4 1.0X
-apache 18201 18301 124 1.1 910.1 0.4X
+java 5091 5176 74 3.9 254.6 1.0X
+apache 16424 16503 69 1.2 821.2 0.3X
diff --git a/sql/core/benchmarks/BloomFilterBenchmark-jdk21-results.txt b/sql/core/benchmarks/BloomFilterBenchmark-jdk21-results.txt
index 8f80b1e19fe32..93c71c9ed9b04 100644
--- a/sql/core/benchmarks/BloomFilterBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/BloomFilterBenchmark-jdk21-results.txt
@@ -2,195 +2,195 @@
ORC Write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter 7475 7543 96 13.4 74.8 1.0X
-With bloom filter 9433 9445 16 10.6 94.3 0.8X
+Without bloom filter 7914 7933 26 12.6 79.1 1.0X
+With bloom filter 9778 9781 5 10.2 97.8 0.8X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 2097152 871 881 13 114.8 8.7 1.0X
-With bloom filter, blocksize: 2097152 593 602 10 168.7 5.9 1.5X
+Without bloom filter, blocksize: 2097152 858 896 34 116.6 8.6 1.0X
+With bloom filter, blocksize: 2097152 576 592 18 173.5 5.8 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 4194304 823 835 18 121.6 8.2 1.0X
-With bloom filter, blocksize: 4194304 535 544 8 186.8 5.4 1.5X
+Without bloom filter, blocksize: 4194304 834 846 11 119.9 8.3 1.0X
+With bloom filter, blocksize: 4194304 546 567 21 183.1 5.5 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 6291456 820 831 17 121.9 8.2 1.0X
-With bloom filter, blocksize: 6291456 536 554 15 186.7 5.4 1.5X
+Without bloom filter, blocksize: 6291456 824 842 18 121.3 8.2 1.0X
+With bloom filter, blocksize: 6291456 560 591 22 178.6 5.6 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 8388608 813 832 20 123.1 8.1 1.0X
-With bloom filter, blocksize: 8388608 538 568 30 185.7 5.4 1.5X
+Without bloom filter, blocksize: 8388608 816 839 21 122.6 8.2 1.0X
+With bloom filter, blocksize: 8388608 550 571 26 181.7 5.5 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 12582912 868 874 9 115.2 8.7 1.0X
-With bloom filter, blocksize: 12582912 550 572 19 181.9 5.5 1.6X
+Without bloom filter, blocksize: 12582912 826 849 22 121.1 8.3 1.0X
+With bloom filter, blocksize: 12582912 586 597 8 170.5 5.9 1.4X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 16777216 808 824 26 123.8 8.1 1.0X
-With bloom filter, blocksize: 16777216 541 561 14 184.7 5.4 1.5X
+Without bloom filter, blocksize: 16777216 811 826 13 123.2 8.1 1.0X
+With bloom filter, blocksize: 16777216 521 541 16 191.9 5.2 1.6X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 33554432 805 818 14 124.3 8.0 1.0X
-With bloom filter, blocksize: 33554432 557 580 18 179.7 5.6 1.4X
+Without bloom filter, blocksize: 33554432 805 824 17 124.3 8.0 1.0X
+With bloom filter, blocksize: 33554432 526 540 10 190.1 5.3 1.5X
================================================================================================
Parquet Write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Without bloom filter 11626 11656 43 8.6 116.3 1.0X
-With bloom filter 14511 14577 93 6.9 145.1 0.8X
-With adaptive bloom filter & 3 candidates 14742 14886 203 6.8 147.4 0.8X
-With adaptive bloom filter & 5 candidates 14784 14789 8 6.8 147.8 0.8X
-With adaptive bloom filter & 9 candidates 14709 14725 23 6.8 147.1 0.8X
-With adaptive bloom filter & 15 candidates 14704 14749 64 6.8 147.0 0.8X
+Without bloom filter 9804 9869 91 10.2 98.0 1.0X
+With bloom filter 13700 13801 143 7.3 137.0 0.7X
+With adaptive bloom filter & 3 candidates 13475 13510 48 7.4 134.8 0.7X
+With adaptive bloom filter & 5 candidates 13308 13387 112 7.5 133.1 0.7X
+With adaptive bloom filter & 9 candidates 13471 13687 306 7.4 134.7 0.7X
+With adaptive bloom filter & 15 candidates 13292 13391 141 7.5 132.9 0.7X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 2097152 414 435 25 241.7 4.1 1.0X
-With bloom filter, blocksize: 2097152 180 196 7 556.2 1.8 2.3X
+Without bloom filter, blocksize: 2097152 429 464 34 232.8 4.3 1.0X
+With bloom filter, blocksize: 2097152 178 188 10 562.2 1.8 2.4X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 4194304 442 448 6 226.2 4.4 1.0X
-With bloom filter, blocksize: 4194304 121 128 7 829.6 1.2 3.7X
+Without bloom filter, blocksize: 4194304 405 410 4 247.1 4.0 1.0X
+With bloom filter, blocksize: 4194304 135 144 5 742.9 1.3 3.0X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 6291456 589 593 2 169.6 5.9 1.0X
-With bloom filter, blocksize: 6291456 125 134 7 799.9 1.3 4.7X
+Without bloom filter, blocksize: 6291456 399 409 8 250.7 4.0 1.0X
+With bloom filter, blocksize: 6291456 130 136 4 768.2 1.3 3.1X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 8388608 593 602 15 168.8 5.9 1.0X
-With bloom filter, blocksize: 8388608 281 292 11 355.3 2.8 2.1X
+Without bloom filter, blocksize: 8388608 403 410 5 248.1 4.0 1.0X
+With bloom filter, blocksize: 8388608 236 246 9 423.2 2.4 1.7X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 12582912 602 626 18 166.2 6.0 1.0X
-With bloom filter, blocksize: 12582912 477 502 29 209.8 4.8 1.3X
+Without bloom filter, blocksize: 12582912 416 453 25 240.1 4.2 1.0X
+With bloom filter, blocksize: 12582912 364 381 9 274.5 3.6 1.1X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 16777216 598 610 18 167.3 6.0 1.0X
-With bloom filter, blocksize: 16777216 520 524 4 192.5 5.2 1.2X
+Without bloom filter, blocksize: 16777216 443 474 21 225.8 4.4 1.0X
+With bloom filter, blocksize: 16777216 423 435 8 236.2 4.2 1.0X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 33554432 627 641 11 159.6 6.3 1.0X
-With bloom filter, blocksize: 33554432 615 629 13 162.6 6.1 1.0X
+Without bloom filter, blocksize: 33554432 421 440 15 237.3 4.2 1.0X
+With bloom filter, blocksize: 33554432 466 475 7 214.7 4.7 0.9X
diff --git a/sql/core/benchmarks/BloomFilterBenchmark-results.txt b/sql/core/benchmarks/BloomFilterBenchmark-results.txt
index 039dd1b73231e..2cdce5bfd7b72 100644
--- a/sql/core/benchmarks/BloomFilterBenchmark-results.txt
+++ b/sql/core/benchmarks/BloomFilterBenchmark-results.txt
@@ -2,195 +2,195 @@
ORC Write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter 7671 7735 92 13.0 76.7 1.0X
-With bloom filter 9571 9658 123 10.4 95.7 0.8X
+Without bloom filter 7656 7767 157 13.1 76.6 1.0X
+With bloom filter 9477 9524 66 10.6 94.8 0.8X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 2097152 912 932 19 109.6 9.1 1.0X
-With bloom filter, blocksize: 2097152 575 597 18 173.9 5.8 1.6X
+Without bloom filter, blocksize: 2097152 894 925 50 111.9 8.9 1.0X
+With bloom filter, blocksize: 2097152 586 596 9 170.5 5.9 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 4194304 801 810 10 124.8 8.0 1.0X
-With bloom filter, blocksize: 4194304 547 562 11 182.7 5.5 1.5X
+Without bloom filter, blocksize: 4194304 856 879 20 116.8 8.6 1.0X
+With bloom filter, blocksize: 4194304 558 579 22 179.1 5.6 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 6291456 814 820 5 122.8 8.1 1.0X
-With bloom filter, blocksize: 6291456 528 552 20 189.3 5.3 1.5X
+Without bloom filter, blocksize: 6291456 840 852 16 119.1 8.4 1.0X
+With bloom filter, blocksize: 6291456 544 566 15 183.8 5.4 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 8388608 804 809 4 124.3 8.0 1.0X
-With bloom filter, blocksize: 8388608 531 556 25 188.3 5.3 1.5X
+Without bloom filter, blocksize: 8388608 813 816 5 123.0 8.1 1.0X
+With bloom filter, blocksize: 8388608 545 567 15 183.3 5.5 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 12582912 816 822 11 122.6 8.2 1.0X
-With bloom filter, blocksize: 12582912 535 548 12 187.0 5.3 1.5X
+Without bloom filter, blocksize: 12582912 825 837 14 121.2 8.3 1.0X
+With bloom filter, blocksize: 12582912 542 547 6 184.6 5.4 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 16777216 790 794 5 126.6 7.9 1.0X
-With bloom filter, blocksize: 16777216 792 798 9 126.3 7.9 1.0X
+Without bloom filter, blocksize: 16777216 827 835 10 120.9 8.3 1.0X
+With bloom filter, blocksize: 16777216 536 542 5 186.5 5.4 1.5X
================================================================================================
ORC Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 33554432 1266 1267 1 79.0 12.7 1.0X
-With bloom filter, blocksize: 33554432 759 769 12 131.8 7.6 1.7X
+Without bloom filter, blocksize: 33554432 802 808 6 124.7 8.0 1.0X
+With bloom filter, blocksize: 33554432 546 570 23 183.0 5.5 1.5X
================================================================================================
Parquet Write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Without bloom filter 11243 11335 130 8.9 112.4 1.0X
-With bloom filter 14701 14728 38 6.8 147.0 0.8X
-With adaptive bloom filter & 3 candidates 14681 14747 93 6.8 146.8 0.8X
-With adaptive bloom filter & 5 candidates 14656 14680 34 6.8 146.6 0.8X
-With adaptive bloom filter & 9 candidates 14597 14739 201 6.9 146.0 0.8X
-With adaptive bloom filter & 15 candidates 14719 15232 726 6.8 147.2 0.8X
+Without bloom filter 10611 10612 1 9.4 106.1 1.0X
+With bloom filter 18632 18656 35 5.4 186.3 0.6X
+With adaptive bloom filter & 3 candidates 18536 18648 159 5.4 185.4 0.6X
+With adaptive bloom filter & 5 candidates 18673 18767 132 5.4 186.7 0.6X
+With adaptive bloom filter & 9 candidates 19199 19339 198 5.2 192.0 0.6X
+With adaptive bloom filter & 15 candidates 18736 18811 107 5.3 187.4 0.6X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 2097152 428 460 31 233.8 4.3 1.0X
-With bloom filter, blocksize: 2097152 180 185 5 556.9 1.8 2.4X
+Without bloom filter, blocksize: 2097152 454 464 13 220.1 4.5 1.0X
+With bloom filter, blocksize: 2097152 177 183 4 565.6 1.8 2.6X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 4194304 425 434 9 235.3 4.2 1.0X
-With bloom filter, blocksize: 4194304 132 142 9 758.3 1.3 3.2X
+Without bloom filter, blocksize: 4194304 424 432 5 235.7 4.2 1.0X
+With bloom filter, blocksize: 4194304 133 143 11 751.8 1.3 3.2X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 6291456 421 425 4 237.8 4.2 1.0X
-With bloom filter, blocksize: 6291456 133 140 5 750.9 1.3 3.2X
+Without bloom filter, blocksize: 6291456 427 434 5 234.1 4.3 1.0X
+With bloom filter, blocksize: 6291456 137 141 3 730.2 1.4 3.1X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 8388608 414 427 21 241.6 4.1 1.0X
-With bloom filter, blocksize: 8388608 180 188 6 555.3 1.8 2.3X
+Without bloom filter, blocksize: 8388608 419 429 5 238.5 4.2 1.0X
+With bloom filter, blocksize: 8388608 180 185 6 557.0 1.8 2.3X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 12582912 415 422 5 241.2 4.1 1.0X
-With bloom filter, blocksize: 12582912 277 284 8 360.9 2.8 1.5X
+Without bloom filter, blocksize: 12582912 427 435 6 234.4 4.3 1.0X
+With bloom filter, blocksize: 12582912 271 274 3 369.6 2.7 1.6X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 16777216 415 421 4 241.0 4.1 1.0X
-With bloom filter, blocksize: 16777216 345 348 2 289.7 3.5 1.2X
+Without bloom filter, blocksize: 16777216 442 457 17 226.2 4.4 1.0X
+With bloom filter, blocksize: 16777216 379 385 7 264.0 3.8 1.2X
================================================================================================
Parquet Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read a row from 100M rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Without bloom filter, blocksize: 33554432 427 430 3 234.2 4.3 1.0X
-With bloom filter, blocksize: 33554432 508 520 12 196.9 5.1 0.8X
+Without bloom filter, blocksize: 33554432 507 520 10 197.1 5.1 1.0X
+With bloom filter, blocksize: 33554432 444 465 32 225.3 4.4 1.1X
diff --git a/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-jdk21-results.txt b/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-jdk21-results.txt
index f5a5e41abc411..f1a8a184aed2f 100644
--- a/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-jdk21-results.txt
@@ -2,69 +2,69 @@
Parquet writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet(PARQUET_1_0) writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1728 1873 205 9.1 109.9 1.0X
-Output Single Double Column 1755 1770 22 9.0 111.6 1.0X
-Output Int and String Column 4182 4224 59 3.8 265.9 0.4X
-Output Partitions 3197 3308 157 4.9 203.2 0.5X
-Output Buckets 4471 4532 86 3.5 284.2 0.4X
+Output Single Int Column 1800 1830 42 8.7 114.5 1.0X
+Output Single Double Column 1730 1764 48 9.1 110.0 1.0X
+Output Int and String Column 4175 4245 98 3.8 265.5 0.4X
+Output Partitions 3118 3174 78 5.0 198.3 0.6X
+Output Buckets 4285 4407 172 3.7 272.4 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet(PARQUET_2_0) writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1911 1937 36 8.2 121.5 1.0X
-Output Single Double Column 1842 1857 21 8.5 117.1 1.0X
-Output Int and String Column 4738 4790 74 3.3 301.2 0.4X
-Output Partitions 3311 3314 5 4.8 210.5 0.6X
-Output Buckets 4457 4463 8 3.5 283.4 0.4X
+Output Single Int Column 1766 1792 36 8.9 112.3 1.0X
+Output Single Double Column 1730 1743 18 9.1 110.0 1.0X
+Output Int and String Column 5000 5014 19 3.1 317.9 0.4X
+Output Partitions 3373 3377 6 4.7 214.4 0.5X
+Output Buckets 4349 4363 21 3.6 276.5 0.4X
================================================================================================
ORC writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
ORC writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1023 1029 9 15.4 65.0 1.0X
-Output Single Double Column 1585 1586 1 9.9 100.7 0.6X
-Output Int and String Column 3941 3976 50 4.0 250.6 0.3X
-Output Partitions 2392 2416 34 6.6 152.1 0.4X
-Output Buckets 3288 3336 69 4.8 209.0 0.3X
+Output Single Int Column 1045 1046 2 15.1 66.4 1.0X
+Output Single Double Column 1700 1700 1 9.3 108.1 0.6X
+Output Int and String Column 3891 3930 55 4.0 247.4 0.3X
+Output Partitions 2441 2453 17 6.4 155.2 0.4X
+Output Buckets 3401 3407 8 4.6 216.2 0.3X
================================================================================================
JSON writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1549 1554 8 10.2 98.5 1.0X
-Output Single Double Column 2290 2293 4 6.9 145.6 0.7X
-Output Int and String Column 3888 3901 18 4.0 247.2 0.4X
-Output Partitions 3097 3098 2 5.1 196.9 0.5X
-Output Buckets 3967 3993 37 4.0 252.2 0.4X
+Output Single Int Column 1531 1534 5 10.3 97.3 1.0X
+Output Single Double Column 2285 2289 6 6.9 145.2 0.7X
+Output Int and String Column 3803 3811 12 4.1 241.8 0.4X
+Output Partitions 3025 3036 15 5.2 192.3 0.5X
+Output Buckets 3817 3827 14 4.1 242.7 0.4X
================================================================================================
CSV writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
CSV writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 3614 3631 23 4.4 229.8 1.0X
-Output Single Double Column 4315 4359 61 3.6 274.4 0.8X
-Output Int and String Column 6223 6230 10 2.5 395.6 0.6X
-Output Partitions 5652 5665 18 2.8 359.3 0.6X
-Output Buckets 6433 6439 8 2.4 409.0 0.6X
+Output Single Int Column 3485 3499 21 4.5 221.6 1.0X
+Output Single Double Column 4287 4316 41 3.7 272.6 0.8X
+Output Int and String Column 6416 6424 11 2.5 407.9 0.5X
+Output Partitions 4985 5016 45 3.2 316.9 0.7X
+Output Buckets 6180 6193 19 2.5 392.9 0.6X
diff --git a/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-results.txt b/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-results.txt
index d335986e385a4..f8805b65e8227 100644
--- a/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-results.txt
+++ b/sql/core/benchmarks/BuiltInDataSourceWriteBenchmark-results.txt
@@ -2,69 +2,69 @@
Parquet writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet(PARQUET_1_0) writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1807 1850 61 8.7 114.9 1.0X
-Output Single Double Column 1877 1878 2 8.4 119.3 1.0X
-Output Int and String Column 4562 4569 10 3.4 290.1 0.4X
-Output Partitions 3272 3312 57 4.8 208.0 0.6X
-Output Buckets 4431 4532 143 3.5 281.7 0.4X
+Output Single Int Column 1818 1898 114 8.7 115.6 1.0X
+Output Single Double Column 1847 1901 76 8.5 117.4 1.0X
+Output Int and String Column 4498 4547 69 3.5 286.0 0.4X
+Output Partitions 3369 3453 118 4.7 214.2 0.5X
+Output Buckets 4790 4814 34 3.3 304.5 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet(PARQUET_2_0) writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1750 1756 8 9.0 111.3 1.0X
-Output Single Double Column 1742 1749 11 9.0 110.7 1.0X
-Output Int and String Column 4936 4943 9 3.2 313.8 0.4X
-Output Partitions 3140 3151 16 5.0 199.7 0.6X
-Output Buckets 4037 4042 7 3.9 256.7 0.4X
+Output Single Int Column 1861 1901 57 8.5 118.3 1.0X
+Output Single Double Column 1866 1873 10 8.4 118.6 1.0X
+Output Int and String Column 4816 4830 19 3.3 306.2 0.4X
+Output Partitions 3270 3287 24 4.8 207.9 0.6X
+Output Buckets 4354 4359 7 3.6 276.8 0.4X
================================================================================================
ORC writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
ORC writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1011 1023 17 15.6 64.3 1.0X
-Output Single Double Column 1523 1526 5 10.3 96.8 0.7X
-Output Int and String Column 3604 3645 58 4.4 229.2 0.3X
-Output Partitions 2397 2397 0 6.6 152.4 0.4X
-Output Buckets 3249 3278 40 4.8 206.6 0.3X
+Output Single Int Column 1004 1030 37 15.7 63.8 1.0X
+Output Single Double Column 1736 1742 9 9.1 110.4 0.6X
+Output Int and String Column 3888 3908 27 4.0 247.2 0.3X
+Output Partitions 2649 2654 7 5.9 168.4 0.4X
+Output Buckets 3544 3562 25 4.4 225.3 0.3X
================================================================================================
JSON writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 1558 1569 14 10.1 99.1 1.0X
-Output Single Double Column 2142 2163 30 7.3 136.2 0.7X
-Output Int and String Column 3999 4021 31 3.9 254.3 0.4X
-Output Partitions 2928 2945 23 5.4 186.2 0.5X
-Output Buckets 3971 3975 5 4.0 252.5 0.4X
+Output Single Int Column 1510 1528 24 10.4 96.0 1.0X
+Output Single Double Column 2198 2201 4 7.2 139.7 0.7X
+Output Int and String Column 3918 3948 41 4.0 249.1 0.4X
+Output Partitions 3058 3069 15 5.1 194.4 0.5X
+Output Buckets 3867 3892 36 4.1 245.8 0.4X
================================================================================================
CSV writer benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
CSV writer benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Output Single Int Column 2961 2980 27 5.3 188.3 1.0X
-Output Single Double Column 3846 3853 9 4.1 244.5 0.8X
-Output Int and String Column 5817 5827 15 2.7 369.8 0.5X
-Output Partitions 4568 4572 6 3.4 290.4 0.6X
-Output Buckets 5719 5753 48 2.8 363.6 0.5X
+Output Single Int Column 2989 3007 25 5.3 190.0 1.0X
+Output Single Double Column 3478 3498 28 4.5 221.1 0.9X
+Output Int and String Column 6016 6059 61 2.6 382.5 0.5X
+Output Partitions 5130 5149 26 3.1 326.2 0.6X
+Output Buckets 5946 5950 6 2.6 378.1 0.5X
diff --git a/sql/core/benchmarks/ByteArrayBenchmark-jdk21-results.txt b/sql/core/benchmarks/ByteArrayBenchmark-jdk21-results.txt
index f6fbe1845b326..86aeef46914fb 100644
--- a/sql/core/benchmarks/ByteArrayBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ByteArrayBenchmark-jdk21-results.txt
@@ -2,26 +2,26 @@
byte array comparisons
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Byte Array compareTo: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-2-7 byte 252 259 4 259.7 3.9 1.0X
-8-16 byte 386 414 34 169.7 5.9 0.7X
-16-32 byte 387 393 7 169.3 5.9 0.7X
-512-1024 byte 521 528 10 125.7 8.0 0.5X
-512 byte slow 1537 1551 10 42.6 23.4 0.2X
-2-7 byte 315 316 1 208.0 4.8 0.8X
+2-7 byte 252 259 4 260.0 3.8 1.0X
+8-16 byte 412 438 34 159.0 6.3 0.6X
+16-32 byte 413 414 1 158.7 6.3 0.6X
+512-1024 byte 554 556 2 118.2 8.5 0.5X
+512 byte slow 1635 1704 64 40.1 25.0 0.2X
+2-7 byte 296 297 2 221.7 4.5 0.9X
================================================================================================
byte array equals
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Byte Array equals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Byte Array equals 789 801 15 202.8 4.9 1.0X
+Byte Array equals 810 814 4 197.6 5.1 1.0X
diff --git a/sql/core/benchmarks/ByteArrayBenchmark-results.txt b/sql/core/benchmarks/ByteArrayBenchmark-results.txt
index b94c773fc513f..2dcb98a837fcd 100644
--- a/sql/core/benchmarks/ByteArrayBenchmark-results.txt
+++ b/sql/core/benchmarks/ByteArrayBenchmark-results.txt
@@ -2,26 +2,26 @@
byte array comparisons
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Byte Array compareTo: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-2-7 byte 258 260 1 253.7 3.9 1.0X
-8-16 byte 388 440 37 169.0 5.9 0.7X
-16-32 byte 466 469 2 140.5 7.1 0.6X
-512-1024 byte 591 592 1 111.0 9.0 0.4X
-512 byte slow 1619 1694 72 40.5 24.7 0.2X
-2-7 byte 298 299 1 219.7 4.6 0.9X
+2-7 byte 259 260 1 253.3 3.9 1.0X
+8-16 byte 439 482 32 149.1 6.7 0.6X
+16-32 byte 501 503 1 130.7 7.7 0.5X
+512-1024 byte 648 652 1 101.1 9.9 0.4X
+512 byte slow 1721 1766 41 38.1 26.3 0.2X
+2-7 byte 296 296 0 221.5 4.5 0.9X
================================================================================================
byte array equals
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Byte Array equals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Byte Array equals 822 829 6 194.7 5.1 1.0X
+Byte Array equals 706 710 1 226.6 4.4 1.0X
diff --git a/sql/core/benchmarks/CSVBenchmark-jdk21-results.txt b/sql/core/benchmarks/CSVBenchmark-jdk21-results.txt
index c3d72d847800d..e2c27a52e1f4b 100644
--- a/sql/core/benchmarks/CSVBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/CSVBenchmark-jdk21-results.txt
@@ -2,76 +2,76 @@
Benchmark to measure CSV read/write performance
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parsing quoted values: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-One quoted string 24351 24419 60 0.0 487014.8 1.0X
+One quoted string 24075 24176 88 0.0 481490.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Wide rows with 1000 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Select 1000 columns 56834 57144 501 0.0 56834.4 1.0X
-Select 100 columns 21054 21095 55 0.0 21054.0 2.7X
-Select one column 17523 17550 27 0.1 17522.9 3.2X
-count() 3658 3676 25 0.3 3657.7 15.5X
-Select 100 columns, one bad input field 25678 25832 245 0.0 25678.1 2.2X
-Select 100 columns, corrupt record field 29027 29102 75 0.0 29026.6 2.0X
+Select 1000 columns 58743 59075 481 0.0 58742.9 1.0X
+Select 100 columns 21215 21234 19 0.0 21215.2 2.8X
+Select one column 17492 17573 122 0.1 17491.7 3.4X
+count() 3652 3697 70 0.3 3652.5 16.1X
+Select 100 columns, one bad input field 25226 25290 75 0.0 25226.1 2.3X
+Select 100 columns, corrupt record field 28706 28800 139 0.0 28705.9 2.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Count a dataset with 10 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Select 10 columns + count() 10832 10860 39 0.9 1083.2 1.0X
-Select 1 column + count() 7372 7399 27 1.4 737.2 1.5X
-count() 1698 1706 8 5.9 169.8 6.4X
+Select 10 columns + count() 10639 10688 49 0.9 1063.9 1.0X
+Select 1 column + count() 7266 7274 7 1.4 726.6 1.5X
+count() 1565 1572 6 6.4 156.5 6.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Create a dataset of timestamps 864 867 2 11.6 86.4 1.0X
-to_csv(timestamp) 6183 6192 11 1.6 618.3 0.1X
-write timestamps to files 6506 6512 7 1.5 650.6 0.1X
-Create a dataset of dates 961 962 2 10.4 96.1 0.9X
-to_csv(date) 4597 4600 5 2.2 459.7 0.2X
-write dates to files 4608 4613 6 2.2 460.8 0.2X
+Create a dataset of timestamps 843 861 23 11.9 84.3 1.0X
+to_csv(timestamp) 5939 5965 45 1.7 593.9 0.1X
+write timestamps to files 6446 6456 9 1.6 644.6 0.1X
+Create a dataset of dates 936 941 5 10.7 93.6 0.9X
+to_csv(date) 4325 4331 5 2.3 432.5 0.2X
+write dates to files 4637 4646 8 2.2 463.7 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-read timestamp text from files 1311 1314 5 7.6 131.1 1.0X
-read timestamps from files 11583 11590 8 0.9 1158.3 0.1X
-infer timestamps from files 22995 23055 64 0.4 2299.5 0.1X
-read date text from files 1234 1276 37 8.1 123.4 1.1X
-read date from files 11216 11238 30 0.9 1121.6 0.1X
-infer date from files 22681 22718 35 0.4 2268.1 0.1X
-timestamp strings 1224 1227 2 8.2 122.4 1.1X
-parse timestamps from Dataset[String] 13706 13760 83 0.7 1370.6 0.1X
-infer timestamps from Dataset[String] 25170 25224 64 0.4 2517.0 0.1X
-date strings 1698 1704 5 5.9 169.8 0.8X
-parse dates from Dataset[String] 12766 12789 21 0.8 1276.6 0.1X
-from_csv(timestamp) 11607 11690 73 0.9 1160.7 0.1X
-from_csv(date) 11353 11364 13 0.9 1135.3 0.1X
-infer error timestamps from Dataset[String] with default format 14883 14927 46 0.7 1488.3 0.1X
-infer error timestamps from Dataset[String] with user-provided format 14897 14928 38 0.7 1489.7 0.1X
-infer error timestamps from Dataset[String] with legacy format 14893 14931 45 0.7 1489.3 0.1X
+read timestamp text from files 1204 1213 8 8.3 120.4 1.0X
+read timestamps from files 11651 11677 22 0.9 1165.1 0.1X
+infer timestamps from files 23349 23353 6 0.4 2334.9 0.1X
+read date text from files 1101 1108 9 9.1 110.1 1.1X
+read date from files 10918 10925 8 0.9 1091.8 0.1X
+infer date from files 22494 22523 26 0.4 2249.4 0.1X
+timestamp strings 1183 1188 5 8.5 118.3 1.0X
+parse timestamps from Dataset[String] 13334 13359 24 0.7 1333.4 0.1X
+infer timestamps from Dataset[String] 24804 24861 50 0.4 2480.4 0.0X
+date strings 1664 1666 3 6.0 166.4 0.7X
+parse dates from Dataset[String] 12782 12826 38 0.8 1278.2 0.1X
+from_csv(timestamp) 11198 11219 23 0.9 1119.8 0.1X
+from_csv(date) 11210 11217 11 0.9 1121.0 0.1X
+infer error timestamps from Dataset[String] with default format 14749 14806 52 0.7 1474.9 0.1X
+infer error timestamps from Dataset[String] with user-provided format 14727 14797 69 0.7 1472.7 0.1X
+infer error timestamps from Dataset[String] with legacy format 14750 14815 92 0.7 1475.0 0.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Filters pushdown: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-w/o filters 4227 4239 14 0.0 42274.8 1.0X
-pushdown disabled 4259 4299 42 0.0 42592.2 1.0X
-w/ filters 741 746 4 0.1 7414.8 5.7X
+w/o filters 4312 4316 6 0.0 43118.3 1.0X
+pushdown disabled 4380 4388 10 0.0 43801.0 1.0X
+w/ filters 829 838 9 0.1 8288.7 5.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Read as Intervals 808 809 1 0.4 2693.2 1.0X
-Read Raw Strings 325 330 6 0.9 1082.6 2.5X
+Read as Intervals 772 785 16 0.4 2571.8 1.0X
+Read Raw Strings 323 330 6 0.9 1076.2 2.4X
diff --git a/sql/core/benchmarks/CSVBenchmark-results.txt b/sql/core/benchmarks/CSVBenchmark-results.txt
index 606263be672ef..8d5f3cf320743 100644
--- a/sql/core/benchmarks/CSVBenchmark-results.txt
+++ b/sql/core/benchmarks/CSVBenchmark-results.txt
@@ -2,76 +2,76 @@
Benchmark to measure CSV read/write performance
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parsing quoted values: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-One quoted string 24626 24670 43 0.0 492514.1 1.0X
+One quoted string 24585 24692 144 0.0 491701.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Wide rows with 1000 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Select 1000 columns 51490 52060 751 0.0 51489.8 1.0X
-Select 100 columns 22350 22409 52 0.0 22349.9 2.3X
-Select one column 19397 19463 110 0.1 19397.4 2.7X
-count() 3518 3521 4 0.3 3517.6 14.6X
-Select 100 columns, one bad input field 27426 27460 48 0.0 27425.9 1.9X
-Select 100 columns, corrupt record field 30873 30931 59 0.0 30872.7 1.7X
+Select 1000 columns 56692 57020 438 0.0 56691.8 1.0X
+Select 100 columns 22207 22251 40 0.0 22206.5 2.6X
+Select one column 18890 18927 43 0.1 18889.9 3.0X
+count() 3530 3572 49 0.3 3530.3 16.1X
+Select 100 columns, one bad input field 27094 27109 23 0.0 27094.0 2.1X
+Select 100 columns, corrupt record field 30004 30083 125 0.0 30003.6 1.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Count a dataset with 10 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Select 10 columns + count() 9260 9278 26 1.1 926.0 1.0X
-Select 1 column + count() 6719 6732 15 1.5 671.9 1.4X
-count() 1605 1606 1 6.2 160.5 5.8X
+Select 10 columns + count() 9066 9092 33 1.1 906.6 1.0X
+Select 1 column + count() 6397 6416 16 1.6 639.7 1.4X
+count() 1500 1507 12 6.7 150.0 6.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Create a dataset of timestamps 853 872 30 11.7 85.3 1.0X
-to_csv(timestamp) 6321 6364 37 1.6 632.1 0.1X
-write timestamps to files 6787 6802 14 1.5 678.7 0.1X
-Create a dataset of dates 972 978 9 10.3 97.2 0.9X
-to_csv(date) 4729 4734 8 2.1 472.9 0.2X
-write dates to files 4759 4771 12 2.1 475.9 0.2X
+Create a dataset of timestamps 972 978 5 10.3 97.2 1.0X
+to_csv(timestamp) 6014 6026 13 1.7 601.4 0.2X
+write timestamps to files 6293 6302 9 1.6 629.3 0.2X
+Create a dataset of dates 971 974 6 10.3 97.1 1.0X
+to_csv(date) 4320 4327 6 2.3 432.0 0.2X
+write dates to files 4137 4153 17 2.4 413.7 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-read timestamp text from files 1229 1242 19 8.1 122.9 1.0X
-read timestamps from files 9798 9822 20 1.0 979.8 0.1X
-infer timestamps from files 19462 19478 24 0.5 1946.2 0.1X
-read date text from files 1116 1119 2 9.0 111.6 1.1X
-read date from files 9909 9922 12 1.0 990.9 0.1X
-infer date from files 20206 20218 19 0.5 2020.6 0.1X
-timestamp strings 1240 1243 3 8.1 124.0 1.0X
-parse timestamps from Dataset[String] 11635 11649 12 0.9 1163.5 0.1X
-infer timestamps from Dataset[String] 21255 21265 9 0.5 2125.5 0.1X
-date strings 1785 1787 3 5.6 178.5 0.7X
-parse dates from Dataset[String] 11553 11571 17 0.9 1155.3 0.1X
-from_csv(timestamp) 9827 9833 5 1.0 982.7 0.1X
-from_csv(date) 10621 10635 12 0.9 1062.1 0.1X
-infer error timestamps from Dataset[String] with default format 12066 12074 12 0.8 1206.6 0.1X
-infer error timestamps from Dataset[String] with user-provided format 12061 12066 6 0.8 1206.1 0.1X
-infer error timestamps from Dataset[String] with legacy format 12033 12042 9 0.8 1203.3 0.1X
+read timestamp text from files 1158 1165 8 8.6 115.8 1.0X
+read timestamps from files 9575 9587 11 1.0 957.5 0.1X
+infer timestamps from files 19365 19406 36 0.5 1936.5 0.1X
+read date text from files 1059 1064 8 9.4 105.9 1.1X
+read date from files 9650 9685 36 1.0 965.0 0.1X
+infer date from files 20159 20171 11 0.5 2015.9 0.1X
+timestamp strings 1180 1183 3 8.5 118.0 1.0X
+parse timestamps from Dataset[String] 11475 11488 20 0.9 1147.5 0.1X
+infer timestamps from Dataset[String] 21022 21030 7 0.5 2102.2 0.1X
+date strings 1640 1641 1 6.1 164.0 0.7X
+parse dates from Dataset[String] 11604 11616 19 0.9 1160.4 0.1X
+from_csv(timestamp) 9428 9456 25 1.1 942.8 0.1X
+from_csv(date) 10226 10268 65 1.0 1022.6 0.1X
+infer error timestamps from Dataset[String] with default format 11716 11728 14 0.9 1171.6 0.1X
+infer error timestamps from Dataset[String] with user-provided format 11726 11734 8 0.9 1172.6 0.1X
+infer error timestamps from Dataset[String] with legacy format 11730 11747 16 0.9 1173.0 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Filters pushdown: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-w/o filters 4092 4098 6 0.0 40917.6 1.0X
-pushdown disabled 3990 4009 20 0.0 39897.7 1.0X
-w/ filters 717 721 4 0.1 7170.8 5.7X
+w/o filters 4305 4314 10 0.0 43050.4 1.0X
+pushdown disabled 4245 4256 10 0.0 42448.7 1.0X
+w/ filters 789 790 2 0.1 7886.0 5.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Read as Intervals 699 705 6 0.4 2331.5 1.0X
-Read Raw Strings 274 279 5 1.1 911.8 2.6X
+Read as Intervals 660 660 1 0.5 2198.5 1.0X
+Read Raw Strings 281 286 5 1.1 937.0 2.3X
diff --git a/sql/core/benchmarks/CharVarcharBenchmark-jdk21-results.txt b/sql/core/benchmarks/CharVarcharBenchmark-jdk21-results.txt
index 640b0c3095f0d..d9f8e2df2d9f3 100644
--- a/sql/core/benchmarks/CharVarcharBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/CharVarcharBenchmark-jdk21-results.txt
@@ -2,121 +2,121 @@
Char Varchar Write Side Perf w/o Tailing Spaces
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 5 6970 7325 311 5.7 174.3 1.0X
-write char with length 5 10016 10047 27 4.0 250.4 0.7X
-write varchar with length 5 7156 7176 22 5.6 178.9 1.0X
+write string with length 5 7168 7314 139 5.6 179.2 1.0X
+write char with length 5 10502 10571 66 3.8 262.6 0.7X
+write varchar with length 5 7223 7343 149 5.5 180.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 10 3332 3385 54 6.0 166.6 1.0X
-write char with length 10 6314 6319 6 3.2 315.7 0.5X
-write varchar with length 10 3647 3673 41 5.5 182.4 0.9X
+write string with length 10 3561 3573 11 5.6 178.1 1.0X
+write char with length 10 6447 6511 55 3.1 322.4 0.6X
+write varchar with length 10 3720 3728 7 5.4 186.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 20 1877 1880 4 5.3 187.7 1.0X
-write char with length 20 4522 4549 42 2.2 452.2 0.4X
-write varchar with length 20 1923 1933 12 5.2 192.3 1.0X
+write string with length 20 1684 1691 6 5.9 168.4 1.0X
+write char with length 20 4764 4788 37 2.1 476.4 0.4X
+write varchar with length 20 1907 1909 3 5.2 190.7 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 40: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 40 961 969 8 5.2 192.1 1.0X
-write char with length 40 3548 3567 22 1.4 709.6 0.3X
-write varchar with length 40 959 967 10 5.2 191.8 1.0X
+write string with length 40 880 885 4 5.7 176.1 1.0X
+write char with length 40 3718 3726 13 1.3 743.5 0.2X
+write varchar with length 40 989 991 3 5.1 197.8 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 60: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 60 616 648 33 5.4 184.9 1.0X
-write char with length 60 3199 3205 8 1.0 959.7 0.2X
-write varchar with length 60 695 698 4 4.8 208.5 0.9X
+write string with length 60 674 678 4 4.9 202.1 1.0X
+write char with length 60 3345 3364 17 1.0 1003.5 0.2X
+write varchar with length 60 705 706 1 4.7 211.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 80: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 80 490 497 6 5.1 196.1 1.0X
-write char with length 80 3006 3020 21 0.8 1202.3 0.2X
-write varchar with length 80 540 548 12 4.6 216.2 0.9X
+write string with length 80 497 501 4 5.0 198.9 1.0X
+write char with length 80 3126 3131 7 0.8 1250.3 0.2X
+write varchar with length 80 563 569 7 4.4 225.3 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 100: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 100 413 418 8 4.8 206.4 1.0X
-write char with length 100 2955 2960 9 0.7 1477.4 0.1X
-write varchar with length 100 452 454 2 4.4 226.1 0.9X
+write string with length 100 390 392 2 5.1 194.8 1.0X
+write char with length 100 3008 3019 10 0.7 1503.9 0.1X
+write varchar with length 100 460 463 5 4.4 229.8 0.8X
================================================================================================
Char Varchar Write Side Perf w/ Tailing Spaces
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 5 8601 8616 22 4.7 215.0 1.0X
-write char with length 5 12123 12186 101 3.3 303.1 0.7X
-write varchar with length 5 12329 12357 42 3.2 308.2 0.7X
+write string with length 5 8133 8163 28 4.9 203.3 1.0X
+write char with length 5 11464 11555 149 3.5 286.6 0.7X
+write varchar with length 5 10906 10970 56 3.7 272.7 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 10 5147 5184 33 3.9 257.3 1.0X
-write char with length 10 8036 8072 39 2.5 401.8 0.6X
-write varchar with length 10 7861 7876 19 2.5 393.1 0.7X
+write string with length 10 4726 4731 7 4.2 236.3 1.0X
+write char with length 10 6837 6849 12 2.9 341.9 0.7X
+write varchar with length 10 6910 6915 5 2.9 345.5 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 20 3124 3131 8 3.2 312.4 1.0X
-write char with length 20 5491 5499 10 1.8 549.1 0.6X
-write varchar with length 20 5562 5567 5 1.8 556.2 0.6X
+write string with length 20 2816 2822 5 3.6 281.6 1.0X
+write char with length 20 4928 4931 5 2.0 492.8 0.6X
+write varchar with length 20 4886 4888 2 2.0 488.6 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 40: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 40 2069 2072 5 2.4 413.8 1.0X
-write char with length 40 4264 4275 13 1.2 852.8 0.5X
-write varchar with length 40 4312 4317 6 1.2 862.3 0.5X
+write string with length 40 1517 1521 3 3.3 303.4 1.0X
+write char with length 40 3716 3719 2 1.3 743.3 0.4X
+write varchar with length 40 3724 3731 6 1.3 744.9 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 60: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 60 1771 1774 3 1.9 531.4 1.0X
-write char with length 60 3884 3887 3 0.9 1165.3 0.5X
-write varchar with length 60 3987 3988 1 0.8 1196.0 0.4X
+write string with length 60 1250 1251 2 2.7 375.0 1.0X
+write char with length 60 3404 3420 22 1.0 1021.1 0.4X
+write varchar with length 60 3412 3419 6 1.0 1023.5 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 80: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 80 1684 1691 6 1.5 673.6 1.0X
-write char with length 80 3712 3721 9 0.7 1484.8 0.5X
-write varchar with length 80 3729 3737 11 0.7 1491.5 0.5X
+write string with length 80 1159 1171 12 2.2 463.8 1.0X
+write char with length 80 3190 3202 17 0.8 1275.9 0.4X
+write varchar with length 80 2868 2870 4 0.9 1147.2 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 100: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 100 1593 1597 6 1.3 796.6 1.0X
-write char with length 100 3723 3726 5 0.5 1861.4 0.4X
-write varchar with length 100 3627 3641 13 0.6 1813.6 0.4X
+write string with length 100 990 994 6 2.0 494.8 1.0X
+write char with length 100 3104 3117 14 0.6 1552.1 0.3X
+write varchar with length 100 2748 2755 9 0.7 1374.1 0.4X
diff --git a/sql/core/benchmarks/CharVarcharBenchmark-results.txt b/sql/core/benchmarks/CharVarcharBenchmark-results.txt
index 49822b663aa12..d76b532eeb5fd 100644
--- a/sql/core/benchmarks/CharVarcharBenchmark-results.txt
+++ b/sql/core/benchmarks/CharVarcharBenchmark-results.txt
@@ -2,121 +2,121 @@
Char Varchar Write Side Perf w/o Tailing Spaces
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 5 7259 7346 87 5.5 181.5 1.0X
-write char with length 5 10259 10279 27 3.9 256.5 0.7X
-write varchar with length 5 7483 7499 23 5.3 187.1 1.0X
+write string with length 5 6572 6829 222 6.1 164.3 1.0X
+write char with length 5 9718 9745 43 4.1 242.9 0.7X
+write varchar with length 5 7419 7449 49 5.4 185.5 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 10 3732 3789 57 5.4 186.6 1.0X
-write char with length 10 6479 6493 14 3.1 324.0 0.6X
-write varchar with length 10 3708 3748 36 5.4 185.4 1.0X
+write string with length 10 3344 3352 8 6.0 167.2 1.0X
+write char with length 10 6395 6435 41 3.1 319.8 0.5X
+write varchar with length 10 3621 3627 6 5.5 181.0 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 20 1752 1761 16 5.7 175.2 1.0X
-write char with length 20 4446 4506 52 2.2 444.6 0.4X
-write varchar with length 20 1900 1923 22 5.3 190.0 0.9X
+write string with length 20 1703 1718 16 5.9 170.3 1.0X
+write char with length 20 4663 4701 37 2.1 466.3 0.4X
+write varchar with length 20 1836 1847 13 5.4 183.6 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 40: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 40 986 997 10 5.1 197.2 1.0X
-write char with length 40 3535 3540 4 1.4 707.1 0.3X
-write varchar with length 40 1037 1043 8 4.8 207.3 1.0X
+write string with length 40 900 911 9 5.6 180.1 1.0X
+write char with length 40 3683 3684 1 1.4 736.6 0.2X
+write varchar with length 40 1017 1028 10 4.9 203.3 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 60: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 60 682 684 2 4.9 204.6 1.0X
-write char with length 60 3192 3201 8 1.0 957.5 0.2X
-write varchar with length 60 715 720 4 4.7 214.5 1.0X
+write string with length 60 634 638 3 5.3 190.2 1.0X
+write char with length 60 3267 3270 3 1.0 980.1 0.2X
+write varchar with length 60 677 689 18 4.9 203.2 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 80: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 80 522 527 7 4.8 208.9 1.0X
-write char with length 80 2997 3006 10 0.8 1199.0 0.2X
-write varchar with length 80 542 553 15 4.6 216.7 1.0X
+write string with length 80 493 493 0 5.1 197.2 1.0X
+write char with length 80 3101 3167 62 0.8 1240.3 0.2X
+write varchar with length 80 557 560 3 4.5 222.9 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 100: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 100 414 420 9 4.8 207.0 1.0X
-write char with length 100 2917 2936 17 0.7 1458.7 0.1X
-write varchar with length 100 462 467 5 4.3 231.1 0.9X
+write string with length 100 399 408 10 5.0 199.7 1.0X
+write char with length 100 3032 3045 12 0.7 1516.1 0.1X
+write varchar with length 100 455 459 7 4.4 227.4 0.9X
================================================================================================
Char Varchar Write Side Perf w/ Tailing Spaces
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 5 8623 8642 16 4.6 215.6 1.0X
-write char with length 5 11664 11723 86 3.4 291.6 0.7X
-write varchar with length 5 11849 11900 60 3.4 296.2 0.7X
+write string with length 5 7780 7823 40 5.1 194.5 1.0X
+write char with length 5 10884 10938 70 3.7 272.1 0.7X
+write varchar with length 5 10615 10673 88 3.8 265.4 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 10 5569 5576 9 3.6 278.5 1.0X
-write char with length 10 7953 7968 25 2.5 397.6 0.7X
-write varchar with length 10 7745 7758 20 2.6 387.3 0.7X
+write string with length 10 4629 4641 11 4.3 231.4 1.0X
+write char with length 10 7046 7050 6 2.8 352.3 0.7X
+write varchar with length 10 6512 6540 24 3.1 325.6 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 20 3400 3409 15 2.9 340.0 1.0X
-write char with length 20 5593 5599 9 1.8 559.3 0.6X
-write varchar with length 20 5128 5134 11 2.0 512.8 0.7X
+write string with length 20 2486 2497 12 4.0 248.6 1.0X
+write char with length 20 4770 4787 15 2.1 477.0 0.5X
+write varchar with length 20 4508 4513 4 2.2 450.8 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 40: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 40 2194 2196 3 2.3 438.8 1.0X
-write char with length 40 4255 4262 7 1.2 850.9 0.5X
-write varchar with length 40 4032 4035 3 1.2 806.5 0.5X
+write string with length 40 1580 1586 5 3.2 316.1 1.0X
+write char with length 40 3773 3777 5 1.3 754.7 0.4X
+write varchar with length 40 3411 3417 8 1.5 682.2 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 60: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 60 1932 1936 5 1.7 579.5 1.0X
-write char with length 60 3976 3991 14 0.8 1192.9 0.5X
-write varchar with length 60 3690 3692 4 0.9 1106.9 0.5X
+write string with length 60 1303 1305 3 2.6 390.9 1.0X
+write char with length 60 3443 3447 4 1.0 1032.9 0.4X
+write varchar with length 60 3097 3099 2 1.1 929.0 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 80: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 80 1751 1759 12 1.4 700.3 1.0X
-write char with length 80 3842 3854 17 0.7 1536.9 0.5X
-write varchar with length 80 3478 3482 5 0.7 1391.2 0.5X
+write string with length 80 1164 1173 7 2.1 465.7 1.0X
+write char with length 80 3342 3346 5 0.7 1336.9 0.3X
+write varchar with length 80 2912 2926 16 0.9 1164.7 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write with length 100: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-write string with length 100 1579 1588 13 1.3 789.7 1.0X
-write char with length 100 3644 3658 18 0.5 1821.9 0.4X
-write varchar with length 100 3390 3393 4 0.6 1694.9 0.5X
+write string with length 100 1064 1071 5 1.9 532.2 1.0X
+write char with length 100 3252 3261 11 0.6 1625.9 0.3X
+write varchar with length 100 2846 2855 8 0.7 1422.9 0.4X
diff --git a/sql/core/benchmarks/CollationBenchmark-jdk21-results.txt b/sql/core/benchmarks/CollationBenchmark-jdk21-results.txt
index 771b6526a7136..e15be5c51f72e 100644
--- a/sql/core/benchmarks/CollationBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/CollationBenchmark-jdk21-results.txt
@@ -1,88 +1,88 @@
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - equalsFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 1702 1703 1 0.1 17020.6 1.0X
-UTF8_LCASE 2636 2639 5 0.0 26357.2 1.5X
-UNICODE 17060 17064 7 0.0 170597.2 10.0X
-UNICODE_CI 16499 16522 33 0.0 164987.9 9.7X
+UTF8_BINARY 1769 1769 1 0.1 17688.3 1.0X
+UTF8_LCASE 2662 2662 1 0.0 26617.3 1.5X
+UNICODE 16947 16955 12 0.0 169467.7 9.6X
+UNICODE_CI 16600 16610 14 0.0 165998.2 9.4X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - compareFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
---------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 1783 1783 0 0.1 17825.5 1.0X
-UTF8_LCASE 2598 2598 0 0.0 25975.5 1.5X
-UNICODE 17608 17611 5 0.0 176075.6 9.9X
-UNICODE_CI 17425 17425 0 0.0 174251.6 9.8X
+UTF8_BINARY 1778 1779 1 0.1 17782.8 1.0X
+UTF8_LCASE 3755 3756 1 0.0 37550.7 2.1X
+UNICODE 17556 17569 18 0.0 175562.4 9.9X
+UNICODE_CI 17348 17360 17 0.0 173481.2 9.8X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - hashFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 2844 2845 1 0.0 28440.6 1.0X
-UTF8_LCASE 5455 5460 8 0.0 54547.5 1.9X
-UNICODE 68308 68344 50 0.0 683078.9 24.0X
-UNICODE_CI 57344 57360 23 0.0 573442.6 20.2X
+UTF8_BINARY 12827 12831 6 0.0 128267.0 1.0X
+UTF8_LCASE 19675 19693 25 0.0 196751.6 1.5X
+UNICODE 106365 106368 4 0.0 1063650.1 8.3X
+UNICODE_CI 153190 153205 20 0.0 1531904.4 11.9X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - contains: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 1704 1704 0 0.1 17035.8 1.0X
-UTF8_LCASE 15349 15352 5 0.0 153485.8 9.0X
-UNICODE 315270 315691 595 0.0 3152700.6 185.1X
-UNICODE_CI 318287 318890 852 0.0 3182870.3 186.8X
+UTF8_BINARY 2879 2881 3 0.0 28786.7 1.0X
+UTF8_LCASE 15268 15275 11 0.0 152677.0 5.3X
+UNICODE 316698 317100 569 0.0 3166978.2 110.0X
+UNICODE_CI 321232 321330 138 0.0 3212319.7 111.6X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - startsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 1992 1992 0 0.1 19918.0 1.0X
-UTF8_LCASE 10388 10388 0 0.0 103878.0 5.2X
-UNICODE 311363 311436 103 0.0 3113630.8 156.3X
-UNICODE_CI 314454 315188 1039 0.0 3144536.7 157.9X
+UTF8_BINARY 2046 2047 1 0.0 20457.6 1.0X
+UTF8_LCASE 11301 11302 1 0.0 113011.9 5.5X
+UNICODE 317856 318087 326 0.0 3178561.7 155.4X
+UNICODE_CI 321502 321592 127 0.0 3215019.0 157.2X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - endsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 2052 2052 1 0.0 20517.7 1.0X
-UTF8_LCASE 11198 11206 11 0.0 111983.3 5.5X
-UNICODE 330704 330753 70 0.0 3307040.2 161.2X
-UNICODE_CI 333624 334191 802 0.0 3336242.4 162.6X
+UTF8_BINARY 2053 2056 4 0.0 20526.5 1.0X
+UTF8_LCASE 11156 11158 2 0.0 111560.7 5.4X
+UNICODE 325433 327150 2428 0.0 3254333.6 158.5X
+UNICODE_CI 331312 331923 864 0.0 3313119.8 161.4X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------
-UNICODE 393 394 1 0.3 3934.9 1.0X
-UNICODE_CI 388 390 1 0.3 3882.2 1.0X
+UNICODE 369 370 0 0.3 3690.8 1.0X
+UNICODE_CI 369 370 0 0.3 3689.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinaryICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 573 574 2 0.2 5727.7 1.0X
-UTF8_LCASE 573 574 1 0.2 5726.9 1.0X
-UNICODE 572 574 2 0.2 5722.1 1.0X
-UNICODE_CI 573 589 33 0.2 5726.9 1.0X
+UTF8_BINARY 565 566 1 0.2 5650.4 1.0X
+UTF8_LCASE 565 566 1 0.2 5653.0 1.0X
+UNICODE 566 566 1 0.2 5655.2 1.0X
+UNICODE_CI 565 566 0 0.2 5651.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinary: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
-----------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 137 138 1 0.7 1371.0 1.0X
-UTF8_LCASE 137 138 1 0.7 1371.4 1.0X
-UNICODE 137 138 1 0.7 1370.2 1.0X
-UNICODE_CI 137 138 1 0.7 1370.3 1.0X
+UTF8_BINARY 137 138 1 0.7 1372.6 1.0X
+UTF8_LCASE 137 138 0 0.7 1371.7 1.0X
+UNICODE 137 138 1 0.7 1373.9 1.0X
+UNICODE_CI 137 138 0 0.7 1373.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execLowercase: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 388 389 1 0.3 3878.0 1.0X
-UTF8_LCASE 388 389 1 0.3 3879.3 1.0X
-UNICODE 388 389 1 0.3 3879.9 1.0X
-UNICODE_CI 388 389 0 0.3 3878.4 1.0X
+UTF8_BINARY 370 371 1 0.3 3696.7 1.0X
+UTF8_LCASE 369 370 1 0.3 3685.8 1.0X
+UNICODE 369 370 1 0.3 3690.9 1.0X
+UNICODE_CI 369 370 0 0.3 3693.8 1.0X
diff --git a/sql/core/benchmarks/CollationBenchmark-results.txt b/sql/core/benchmarks/CollationBenchmark-results.txt
index 4b178530f1c6e..bf5cd74a86c6f 100644
--- a/sql/core/benchmarks/CollationBenchmark-results.txt
+++ b/sql/core/benchmarks/CollationBenchmark-results.txt
@@ -1,88 +1,88 @@
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - equalsFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 1750 1751 2 0.1 17498.8 1.0X
-UTF8_LCASE 2882 2884 3 0.0 28824.3 1.6X
-UNICODE 19141 19143 3 0.0 191411.8 10.9X
-UNICODE_CI 18699 18703 6 0.0 186988.2 10.7X
+UTF8_BINARY 1748 1750 2 0.1 17482.9 1.0X
+UTF8_LCASE 3042 3045 4 0.0 30424.8 1.7X
+UNICODE 19142 19156 19 0.0 191422.9 10.9X
+UNICODE_CI 19141 19147 10 0.0 191405.2 10.9X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - compareFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
---------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 1737 1738 2 0.1 17369.8 1.0X
-UTF8_LCASE 3079 3082 4 0.0 30791.2 1.8X
-UNICODE 19852 19859 9 0.0 198518.8 11.4X
-UNICODE_CI 19727 19728 1 0.0 197272.5 11.4X
+UTF8_BINARY 1708 1709 2 0.1 17079.7 1.0X
+UTF8_LCASE 3149 3150 2 0.0 31487.7 1.8X
+UNICODE 19352 19361 13 0.0 193515.4 11.3X
+UNICODE_CI 19185 19188 4 0.0 191851.2 11.2X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - hashFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 3092 3093 1 0.0 30922.4 1.0X
-UTF8_LCASE 6473 6474 2 0.0 64728.0 2.1X
-UNICODE 66907 66913 9 0.0 669070.9 21.6X
-UNICODE_CI 55134 55219 119 0.0 551343.8 17.8X
+UTF8_BINARY 13960 13960 0 0.0 139601.6 1.0X
+UTF8_LCASE 25003 25005 2 0.0 250031.9 1.8X
+UNICODE 117914 117918 6 0.0 1179141.1 8.4X
+UNICODE_CI 160718 160758 57 0.0 1607177.0 11.5X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - contains: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 2107 2109 2 0.0 21073.8 1.0X
-UTF8_LCASE 17995 17997 4 0.0 179946.3 8.5X
-UNICODE 318380 318887 717 0.0 3183800.7 151.1X
-UNICODE_CI 309694 309747 74 0.0 3096942.4 147.0X
+UTF8_BINARY 2244 2246 3 0.0 22444.5 1.0X
+UTF8_LCASE 17111 17112 1 0.0 171107.2 7.6X
+UNICODE 317260 318448 1680 0.0 3172604.4 141.4X
+UNICODE_CI 313112 313564 639 0.0 3131124.6 139.5X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - startsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 2502 2504 2 0.0 25023.7 1.0X
-UTF8_LCASE 17341 17344 4 0.0 173412.8 6.9X
-UNICODE 304576 305362 1112 0.0 3045764.2 121.7X
-UNICODE_CI 308506 309328 1161 0.0 3085064.4 123.3X
+UTF8_BINARY 2365 2374 13 0.0 23648.0 1.0X
+UTF8_LCASE 17098 17103 7 0.0 170981.8 7.2X
+UNICODE 308770 308831 86 0.0 3087700.9 130.6X
+UNICODE_CI 312503 312717 303 0.0 3125027.8 132.1X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - endsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 2518 2518 0 0.0 25184.0 1.0X
-UTF8_LCASE 17347 17352 7 0.0 173470.3 6.9X
-UNICODE 319689 320154 658 0.0 3196888.5 126.9X
-UNICODE_CI 322042 322706 939 0.0 3220420.5 127.9X
+UTF8_BINARY 2481 2481 0 0.0 24811.2 1.0X
+UTF8_LCASE 17154 17155 2 0.0 171542.6 6.9X
+UNICODE 328959 329495 758 0.0 3289591.2 132.6X
+UNICODE_CI 333560 334318 1073 0.0 3335595.5 134.4X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------
-UNICODE 420 421 2 0.2 4196.0 1.0X
-UNICODE_CI 419 420 1 0.2 4190.7 1.0X
+UNICODE 298 299 1 0.3 2982.0 1.0X
+UNICODE_CI 298 299 0 0.3 2981.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinaryICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 598 599 1 0.2 5982.9 1.0X
-UTF8_LCASE 598 599 1 0.2 5980.5 1.0X
-UNICODE 598 600 3 0.2 5979.3 1.0X
-UNICODE_CI 598 599 1 0.2 5978.9 1.0X
+UTF8_BINARY 577 578 1 0.2 5767.1 1.0X
+UTF8_LCASE 576 577 1 0.2 5762.1 1.0X
+UNICODE 577 577 1 0.2 5768.5 1.0X
+UNICODE_CI 577 577 0 0.2 5768.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinary: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
-----------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 181 182 1 0.6 1810.0 1.0X
-UTF8_LCASE 181 182 1 0.6 1810.8 1.0X
-UNICODE 181 182 1 0.6 1810.1 1.0X
-UNICODE_CI 181 182 0 0.6 1810.9 1.0X
+UTF8_BINARY 185 185 1 0.5 1847.2 1.0X
+UTF8_LCASE 185 185 0 0.5 1846.8 1.0X
+UNICODE 185 185 0 0.5 1847.5 1.0X
+UNICODE_CI 185 185 1 0.5 1846.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execLowercase: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 419 420 1 0.2 4190.1 1.0X
-UTF8_LCASE 419 420 1 0.2 4194.1 1.0X
-UNICODE 419 420 1 0.2 4188.6 1.0X
-UNICODE_CI 419 420 1 0.2 4189.5 1.0X
+UTF8_BINARY 317 317 0 0.3 3166.9 1.0X
+UTF8_LCASE 317 318 0 0.3 3170.9 1.0X
+UNICODE 316 317 0 0.3 3163.9 1.0X
+UNICODE_CI 316 317 1 0.3 3163.6 1.0X
diff --git a/sql/core/benchmarks/CollationNonASCIIBenchmark-jdk21-results.txt b/sql/core/benchmarks/CollationNonASCIIBenchmark-jdk21-results.txt
index 3c0b9d1647ee7..cdce26c80a5d1 100644
--- a/sql/core/benchmarks/CollationNonASCIIBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/CollationNonASCIIBenchmark-jdk21-results.txt
@@ -1,88 +1,88 @@
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - equalsFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 193 193 1 0.2 4819.3 1.0X
-UTF8_LCASE 7333 7334 1 0.0 183334.3 38.0X
-UNICODE 5117 5122 8 0.0 127913.6 26.5X
-UNICODE_CI 5127 5138 16 0.0 128171.7 26.6X
+UTF8_BINARY 193 194 2 0.2 4825.3 1.0X
+UTF8_LCASE 7364 7365 2 0.0 184098.9 38.2X
+UNICODE 5138 5143 7 0.0 128446.5 26.6X
+UNICODE_CI 5273 5274 1 0.0 131830.6 27.3X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - compareFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
---------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 320 320 0 0.1 7988.9 1.0X
-UTF8_LCASE 7380 7384 6 0.0 184501.6 23.1X
-UNICODE 5380 5382 2 0.0 134502.1 16.8X
-UNICODE_CI 5329 5330 1 0.0 133234.0 16.7X
+UTF8_BINARY 297 297 0 0.1 7428.2 1.0X
+UTF8_LCASE 7223 7224 1 0.0 180585.9 24.3X
+UNICODE 5167 5168 1 0.0 129185.4 17.4X
+UNICODE_CI 5118 5124 7 0.0 127959.9 17.2X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - hashFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 389 391 2 0.1 9731.7 1.0X
-UTF8_LCASE 3765 3767 2 0.0 94136.1 9.7X
-UNICODE 14511 14522 16 0.0 362778.4 37.3X
-UNICODE_CI 11611 11629 25 0.0 290286.6 29.8X
+UTF8_BINARY 1781 1785 6 0.0 44533.6 1.0X
+UTF8_LCASE 6031 6031 1 0.0 150765.3 3.4X
+UNICODE 21149 21157 12 0.0 528720.3 11.9X
+UNICODE_CI 27480 27489 13 0.0 686999.9 15.4X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - contains: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 397 398 1 0.1 9932.6 1.0X
-UTF8_LCASE 8126 8133 10 0.0 203142.7 20.5X
-UNICODE 59149 59172 32 0.0 1478723.8 148.9X
-UNICODE_CI 59069 59086 24 0.0 1476724.4 148.7X
+UTF8_BINARY 527 527 0 0.1 13166.7 1.0X
+UTF8_LCASE 9131 9135 6 0.0 228267.9 17.3X
+UNICODE 60953 60989 52 0.0 1523813.1 115.7X
+UNICODE_CI 62495 62503 12 0.0 1562377.7 118.7X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - startsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 322 322 0 0.1 8057.5 1.0X
-UTF8_LCASE 5402 5402 0 0.0 135048.8 16.8X
-UNICODE 58820 58831 15 0.0 1470505.1 182.5X
-UNICODE_CI 59412 59560 210 0.0 1485296.8 184.3X
+UTF8_BINARY 275 276 0 0.1 6882.2 1.0X
+UTF8_LCASE 5751 5751 1 0.0 143769.6 20.9X
+UNICODE 62099 62196 139 0.0 1552462.9 225.6X
+UNICODE_CI 62870 62928 82 0.0 1571750.5 228.4X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - endsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 313 313 0 0.1 7828.0 1.0X
-UTF8_LCASE 5456 5474 26 0.0 136400.1 17.4X
-UNICODE 64778 64790 16 0.0 1619459.4 206.9X
-UNICODE_CI 63831 63915 117 0.0 1595786.8 203.9X
+UTF8_BINARY 260 260 0 0.2 6502.2 1.0X
+UTF8_LCASE 5910 5914 6 0.0 147754.7 22.7X
+UNICODE 68219 68299 114 0.0 1705463.3 262.3X
+UNICODE_CI 67093 67462 523 0.0 1677318.2 258.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------
-UNICODE 216 216 0 0.2 5394.2 1.0X
-UNICODE_CI 214 215 0 0.2 5352.1 1.0X
+UNICODE 207 208 1 0.2 5176.3 1.0X
+UNICODE_CI 207 208 1 0.2 5174.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinaryICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 323 334 25 0.1 8067.4 1.0X
-UTF8_LCASE 323 323 0 0.1 8064.4 1.0X
-UNICODE 322 323 1 0.1 8057.2 1.0X
-UNICODE_CI 323 323 1 0.1 8063.9 1.0X
+UTF8_BINARY 323 323 0 0.1 8067.0 1.0X
+UTF8_LCASE 323 323 0 0.1 8067.9 1.0X
+UNICODE 322 323 1 0.1 8062.3 1.0X
+UNICODE_CI 322 323 0 0.1 8061.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinary: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
-----------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 86 87 0 0.5 2149.3 1.0X
-UTF8_LCASE 86 87 0 0.5 2145.8 1.0X
-UNICODE 86 87 0 0.5 2150.8 1.0X
-UNICODE_CI 86 87 1 0.5 2151.2 1.0X
+UTF8_BINARY 85 86 0 0.5 2121.4 1.0X
+UTF8_LCASE 85 86 0 0.5 2122.4 1.0X
+UNICODE 85 86 0 0.5 2120.1 1.0X
+UNICODE_CI 85 86 0 0.5 2119.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.7+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execLowercase: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 214 214 0 0.2 5345.7 1.0X
-UTF8_LCASE 214 220 12 0.2 5349.8 1.0X
-UNICODE 214 214 1 0.2 5340.1 1.0X
-UNICODE_CI 214 214 0 0.2 5339.8 1.0X
+UTF8_BINARY 208 209 1 0.2 5195.0 1.0X
+UTF8_LCASE 208 208 0 0.2 5197.6 1.0X
+UNICODE 208 208 0 0.2 5196.5 1.0X
+UNICODE_CI 208 209 1 0.2 5198.4 1.0X
diff --git a/sql/core/benchmarks/CollationNonASCIIBenchmark-results.txt b/sql/core/benchmarks/CollationNonASCIIBenchmark-results.txt
index 21edf6d64859c..3f2d6fc1edce8 100644
--- a/sql/core/benchmarks/CollationNonASCIIBenchmark-results.txt
+++ b/sql/core/benchmarks/CollationNonASCIIBenchmark-results.txt
@@ -1,88 +1,88 @@
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - equalsFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 171 172 1 0.2 4277.4 1.0X
-UTF8_LCASE 7351 7351 1 0.0 183764.8 43.0X
-UNICODE 5655 5657 3 0.0 141374.5 33.1X
-UNICODE_CI 5739 5741 2 0.0 143486.9 33.5X
+UTF8_BINARY 174 176 4 0.2 4357.6 1.0X
+UTF8_LCASE 7310 7312 2 0.0 182759.8 41.9X
+UNICODE 6486 6486 1 0.0 162152.0 37.2X
+UNICODE_CI 6365 6365 1 0.0 159118.5 36.5X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - compareFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
---------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 300 300 0 0.1 7500.6 1.0X
-UTF8_LCASE 7137 7165 40 0.0 178413.7 23.8X
-UNICODE 5506 5510 5 0.0 137660.9 18.4X
-UNICODE_CI 5468 5473 7 0.0 136699.1 18.2X
+UTF8_BINARY 479 480 1 0.1 11966.1 1.0X
+UTF8_LCASE 7479 7480 1 0.0 186981.5 15.6X
+UNICODE 6517 6526 13 0.0 162913.6 13.6X
+UNICODE_CI 6467 6488 29 0.0 161684.0 13.5X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - hashFunction: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 717 718 2 0.1 17925.8 1.0X
-UTF8_LCASE 3642 3643 1 0.0 91045.7 5.1X
-UNICODE 14060 14072 17 0.0 351498.4 19.6X
-UNICODE_CI 12921 12923 2 0.0 323026.0 18.0X
+UTF8_BINARY 1976 1978 2 0.0 49402.1 1.0X
+UTF8_LCASE 6319 6322 4 0.0 157976.7 3.2X
+UNICODE 22688 22698 14 0.0 567210.9 11.5X
+UNICODE_CI 29579 29579 1 0.0 739471.9 15.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - contains: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 552 553 1 0.1 13806.7 1.0X
-UTF8_LCASE 8430 8436 8 0.0 210740.5 15.3X
-UNICODE 59134 59277 202 0.0 1478349.1 107.1X
-UNICODE_CI 55157 55368 299 0.0 1378923.9 99.9X
+UTF8_BINARY 604 604 1 0.1 15092.4 1.0X
+UTF8_LCASE 8491 8518 38 0.0 212269.4 14.1X
+UNICODE 60312 60430 167 0.0 1507792.3 99.9X
+UNICODE_CI 57877 57884 10 0.0 1446922.4 95.9X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - startsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 335 336 0 0.1 8384.1 1.0X
-UTF8_LCASE 5312 5314 3 0.0 132802.3 15.8X
-UNICODE 54850 54887 53 0.0 1371249.7 163.6X
-UNICODE_CI 55529 55678 211 0.0 1388216.9 165.6X
+UTF8_BINARY 376 377 1 0.1 9402.1 1.0X
+UTF8_LCASE 5370 5371 1 0.0 134249.8 14.3X
+UNICODE 57074 57101 39 0.0 1426838.7 151.8X
+UNICODE_CI 57428 57492 90 0.0 1435699.4 152.7X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - endsWith: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 338 338 1 0.1 8437.7 1.0X
-UTF8_LCASE 5363 5389 37 0.0 134077.3 15.9X
-UNICODE 61997 62088 128 0.0 1549932.7 183.7X
-UNICODE_CI 61712 61836 176 0.0 1542800.4 182.8X
+UTF8_BINARY 376 377 1 0.1 9389.3 1.0X
+UTF8_LCASE 5340 5341 0 0.0 133505.3 14.2X
+UNICODE 63927 63986 83 0.0 1598179.3 170.2X
+UNICODE_CI 63400 63579 253 0.0 1585004.3 168.8X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------
-UNICODE 225 226 0 0.2 5628.8 1.0X
-UNICODE_CI 225 226 0 0.2 5627.4 1.0X
+UNICODE 266 268 2 0.2 6649.1 1.0X
+UNICODE_CI 267 269 1 0.1 6681.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinaryICU: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 316 317 1 0.1 7904.0 1.0X
-UTF8_LCASE 316 317 1 0.1 7905.4 1.0X
-UNICODE 316 317 1 0.1 7899.7 1.0X
-UNICODE_CI 316 317 0 0.1 7904.5 1.0X
+UTF8_BINARY 314 315 0 0.1 7854.1 1.0X
+UTF8_LCASE 315 315 0 0.1 7863.0 1.0X
+UNICODE 314 315 0 0.1 7858.8 1.0X
+UNICODE_CI 314 315 1 0.1 7852.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execBinary: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
-----------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 126 127 0 0.3 3147.2 1.0X
-UTF8_LCASE 126 127 1 0.3 3154.2 1.0X
-UNICODE 126 127 1 0.3 3149.0 1.0X
-UNICODE_CI 126 127 1 0.3 3157.4 1.0X
+UTF8_BINARY 158 160 1 0.3 3947.4 1.0X
+UTF8_LCASE 159 160 1 0.3 3979.2 1.0X
+UNICODE 158 160 1 0.3 3962.3 1.0X
+UNICODE_CI 159 160 0 0.3 3983.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.15+6-LTS on Linux 6.11.0-1012-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collation unit benchmarks - initCap using impl execLowercase: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative time
--------------------------------------------------------------------------------------------------------------------------------------------
-UTF8_BINARY 224 225 1 0.2 5598.3 1.0X
-UTF8_LCASE 224 225 1 0.2 5596.6 1.0X
-UNICODE 224 225 0 0.2 5599.3 1.0X
-UNICODE_CI 224 225 1 0.2 5596.4 1.0X
+UTF8_BINARY 265 271 8 0.2 6630.7 1.0X
+UTF8_LCASE 265 267 2 0.2 6622.7 1.0X
+UNICODE 265 266 1 0.2 6633.8 1.0X
+UNICODE_CI 267 269 1 0.1 6677.1 1.0X
diff --git a/sql/core/benchmarks/ColumnarBatchBenchmark-jdk21-results.txt b/sql/core/benchmarks/ColumnarBatchBenchmark-jdk21-results.txt
index 5e4032460e6af..b0a81778443ee 100644
--- a/sql/core/benchmarks/ColumnarBatchBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ColumnarBatchBenchmark-jdk21-results.txt
@@ -2,58 +2,58 @@
Int Read/Write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Int Read/Write: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Java Array 119 120 0 2745.9 0.4 1.0X
-ByteBuffer Unsafe 199 203 5 1648.0 0.6 0.6X
-ByteBuffer API 349 350 1 937.6 1.1 0.3X
-DirectByteBuffer 419 420 1 781.8 1.3 0.3X
-Unsafe Buffer 155 155 0 2119.1 0.5 0.8X
-Column(on heap) 124 124 0 2642.9 0.4 1.0X
-Column(off heap) 154 155 1 2124.3 0.5 0.8X
-Column(off heap direct) 155 155 0 2118.0 0.5 0.8X
-UnsafeRow (on heap) 435 435 0 753.9 1.3 0.3X
-UnsafeRow (off heap) 295 296 1 1111.1 0.9 0.4X
-Column On Heap Append 312 319 6 1049.0 1.0 0.4X
+Java Array 123 123 1 2664.6 0.4 1.0X
+ByteBuffer Unsafe 191 197 7 1714.7 0.6 0.6X
+ByteBuffer API 443 443 0 740.2 1.4 0.3X
+DirectByteBuffer 419 420 0 781.4 1.3 0.3X
+Unsafe Buffer 154 154 0 2124.5 0.5 0.8X
+Column(on heap) 124 124 0 2643.6 0.4 1.0X
+Column(off heap) 154 155 0 2121.4 0.5 0.8X
+Column(off heap direct) 154 155 0 2121.0 0.5 0.8X
+UnsafeRow (on heap) 435 440 12 754.0 1.3 0.3X
+UnsafeRow (off heap) 295 296 1 1110.5 0.9 0.4X
+Column On Heap Append 313 314 2 1048.3 1.0 0.4X
================================================================================================
Boolean Read/Write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Boolean Read/Write: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Bitset 523 525 2 641.1 1.6 1.0X
-Byte Array 250 251 2 1341.9 0.7 2.1X
+Bitset 432 433 0 776.0 1.3 1.0X
+Byte Array 237 237 0 1417.2 0.7 1.8X
================================================================================================
String Read/Write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String Read/Write: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-On Heap 126 128 2 130.2 7.7 1.0X
-Off Heap 402 424 19 40.8 24.5 0.3X
+On Heap 126 129 2 129.7 7.7 1.0X
+Off Heap 410 469 34 40.0 25.0 0.3X
================================================================================================
Array Vector Read
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array Vector Read: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-On Heap Read Size Only 86 86 0 1898.6 0.5 1.0X
-Off Heap Read Size Only 358 361 2 457.2 2.2 0.2X
-On Heap Read Elements 2405 2407 3 68.1 14.7 0.0X
-Off Heap Read Elements 2648 2652 5 61.9 16.2 0.0X
+On Heap Read Size Only 88 88 0 1865.6 0.5 1.0X
+Off Heap Read Size Only 427 427 0 383.6 2.6 0.2X
+On Heap Read Elements 2480 2564 120 66.1 15.1 0.0X
+Off Heap Read Elements 2448 2496 68 66.9 14.9 0.0X
diff --git a/sql/core/benchmarks/ColumnarBatchBenchmark-results.txt b/sql/core/benchmarks/ColumnarBatchBenchmark-results.txt
index d2123457fe149..e0a39640e547c 100644
--- a/sql/core/benchmarks/ColumnarBatchBenchmark-results.txt
+++ b/sql/core/benchmarks/ColumnarBatchBenchmark-results.txt
@@ -2,58 +2,58 @@
Int Read/Write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Int Read/Write: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Java Array 175 176 0 1869.0 0.5 1.0X
-ByteBuffer Unsafe 304 307 1 1077.0 0.9 0.6X
-ByteBuffer API 510 511 1 642.7 1.6 0.3X
-DirectByteBuffer 406 406 0 807.8 1.2 0.4X
-Unsafe Buffer 162 163 1 2023.2 0.5 1.1X
-Column(on heap) 171 172 1 1912.8 0.5 1.0X
-Column(off heap) 163 163 1 2015.1 0.5 1.1X
-Column(off heap direct) 158 158 0 2078.2 0.5 1.1X
-UnsafeRow (on heap) 439 439 0 747.1 1.3 0.4X
-UnsafeRow (off heap) 315 316 2 1041.6 1.0 0.6X
-Column On Heap Append 389 390 1 842.3 1.2 0.5X
+Java Array 196 196 0 1673.2 0.6 1.0X
+ByteBuffer Unsafe 288 288 0 1139.3 0.9 0.7X
+ByteBuffer API 510 511 1 643.0 1.6 0.4X
+DirectByteBuffer 469 470 0 698.1 1.4 0.4X
+Unsafe Buffer 162 163 0 2016.7 0.5 1.2X
+Column(on heap) 171 172 0 1911.9 0.5 1.1X
+Column(off heap) 163 163 0 2010.0 0.5 1.2X
+Column(off heap direct) 158 158 0 2074.5 0.5 1.2X
+UnsafeRow (on heap) 439 442 6 747.2 1.3 0.4X
+UnsafeRow (off heap) 314 317 2 1043.7 1.0 0.6X
+Column On Heap Append 363 364 0 902.1 1.1 0.5X
================================================================================================
Boolean Read/Write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Boolean Read/Write: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Bitset 445 447 1 753.3 1.3 1.0X
-Byte Array 263 264 1 1274.2 0.8 1.7X
+Bitset 479 480 0 699.8 1.4 1.0X
+Byte Array 263 264 0 1274.3 0.8 1.8X
================================================================================================
String Read/Write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String Read/Write: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-On Heap 142 144 1 115.3 8.7 1.0X
-Off Heap 393 410 12 41.7 24.0 0.4X
+On Heap 142 143 2 115.2 8.7 1.0X
+Off Heap 367 394 18 44.7 22.4 0.4X
================================================================================================
Array Vector Read
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array Vector Read: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-On Heap Read Size Only 88 88 0 1869.3 0.5 1.0X
-Off Heap Read Size Only 85 86 0 1920.0 0.5 1.0X
-On Heap Read Elements 2415 2417 3 67.8 14.7 0.0X
-Off Heap Read Elements 2880 2880 1 56.9 17.6 0.0X
+On Heap Read Size Only 90 90 0 1818.9 0.5 1.0X
+Off Heap Read Size Only 86 86 0 1915.7 0.5 1.1X
+On Heap Read Elements 2195 2199 6 74.6 13.4 0.0X
+Off Heap Read Elements 2791 2793 3 58.7 17.0 0.0X
diff --git a/sql/core/benchmarks/CompressionSchemeBenchmark-jdk21-results.txt b/sql/core/benchmarks/CompressionSchemeBenchmark-jdk21-results.txt
index e177803bb1efa..6901556ad1faf 100644
--- a/sql/core/benchmarks/CompressionSchemeBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/CompressionSchemeBenchmark-jdk21-results.txt
@@ -2,136 +2,136 @@
Compression Scheme Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
BOOLEAN Encode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 1 1 0 47214.4 0.0 1.0X
-RunLengthEncoding(2.515) 943 1094 261 71.2 14.1 0.0X
-BooleanBitSet(0.125) 292 293 0 229.5 4.4 0.0X
+PassThrough(1.000) 1 1 0 48542.5 0.0 1.0X
+RunLengthEncoding(2.497) 940 946 9 71.4 14.0 0.0X
+BooleanBitSet(0.125) 274 274 0 245.1 4.1 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
BOOLEAN Decode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 212 213 1 317.1 3.2 1.0X
-RunLengthEncoding 618 618 0 108.6 9.2 0.3X
-BooleanBitSet 668 669 0 100.4 10.0 0.3X
+PassThrough 211 212 1 318.3 3.1 1.0X
+RunLengthEncoding 580 581 1 115.7 8.6 0.4X
+BooleanBitSet 678 681 4 98.9 10.1 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Encode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 3 3 0 24468.7 0.0 1.0X
-RunLengthEncoding(1.504) 1066 1068 3 63.0 15.9 0.0X
+PassThrough(1.000) 3 3 0 24472.0 0.0 1.0X
+RunLengthEncoding(1.501) 1131 1131 0 59.3 16.9 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Decode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 710 710 0 94.5 10.6 1.0X
-RunLengthEncoding 1000 1000 0 67.1 14.9 0.7X
+PassThrough 627 628 1 107.0 9.3 1.0X
+RunLengthEncoding 986 987 0 68.0 14.7 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Encode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 3 3 0 24523.0 0.0 1.0X
-RunLengthEncoding(2.017) 1108 1109 0 60.6 16.5 0.0X
+PassThrough(1.000) 3 3 0 24323.5 0.0 1.0X
+RunLengthEncoding(2.008) 1170 1170 0 57.4 17.4 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Decode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 648 650 3 103.6 9.7 1.0X
-RunLengthEncoding 939 942 2 71.4 14.0 0.7X
+PassThrough 606 607 1 110.8 9.0 1.0X
+RunLengthEncoding 962 963 1 69.7 14.3 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Encode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 6 6 0 11110.5 0.1 1.0X
-RunLengthEncoding(0.996) 1029 1029 1 65.2 15.3 0.0X
-DictionaryEncoding(0.500) 343 344 1 195.6 5.1 0.0X
-IntDelta(0.250) 110 110 0 609.4 1.6 0.1X
+PassThrough(1.000) 6 6 0 11620.1 0.1 1.0X
+RunLengthEncoding(0.998) 1048 1050 2 64.0 15.6 0.0X
+DictionaryEncoding(0.500) 518 519 0 129.5 7.7 0.0X
+IntDelta(0.250) 141 142 1 477.0 2.1 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Decode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 648 651 2 103.6 9.7 1.0X
-RunLengthEncoding 1222 1224 3 54.9 18.2 0.5X
-DictionaryEncoding 544 545 0 123.3 8.1 1.2X
-IntDelta 502 504 2 133.6 7.5 1.3X
+PassThrough 647 648 2 103.7 9.6 1.0X
+RunLengthEncoding 1120 1127 9 59.9 16.7 0.6X
+DictionaryEncoding 549 551 3 122.1 8.2 1.2X
+IntDelta 501 502 0 133.9 7.5 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Encode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 6 6 0 11275.3 0.1 1.0X
-RunLengthEncoding(1.336) 1064 1064 0 63.1 15.9 0.0X
-DictionaryEncoding(0.501) 343 343 0 195.6 5.1 0.0X
-IntDelta(0.250) 111 111 1 606.8 1.6 0.1X
+PassThrough(1.000) 6 6 0 11163.4 0.1 1.0X
+RunLengthEncoding(1.335) 1078 1078 0 62.3 16.1 0.0X
+DictionaryEncoding(0.501) 399 399 0 168.2 5.9 0.0X
+IntDelta(0.250) 132 133 0 506.7 2.0 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Decode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 731 733 2 91.8 10.9 1.0X
-RunLengthEncoding 1220 1223 4 55.0 18.2 0.6X
-DictionaryEncoding 671 673 2 100.0 10.0 1.1X
-IntDelta 524 603 53 128.1 7.8 1.4X
+PassThrough 710 710 1 94.5 10.6 1.0X
+RunLengthEncoding 1216 1217 1 55.2 18.1 0.6X
+DictionaryEncoding 671 672 2 100.1 10.0 1.1X
+IntDelta 522 522 0 128.6 7.8 1.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Encode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 13 14 0 4998.1 0.2 1.0X
-RunLengthEncoding(0.749) 1056 1056 0 63.5 15.7 0.0X
-DictionaryEncoding(0.250) 409 410 2 164.2 6.1 0.0X
-LongDelta(0.125) 111 111 0 603.3 1.7 0.1X
+PassThrough(1.000) 14 14 0 4948.2 0.2 1.0X
+RunLengthEncoding(0.749) 1072 1072 0 62.6 16.0 0.0X
+DictionaryEncoding(0.250) 424 425 1 158.3 6.3 0.0X
+LongDelta(0.125) 133 134 0 504.1 2.0 0.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Decode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 837 838 2 80.2 12.5 1.0X
-RunLengthEncoding 1260 1263 3 53.2 18.8 0.7X
-DictionaryEncoding 810 818 11 82.9 12.1 1.0X
-LongDelta 544 546 2 123.3 8.1 1.5X
+PassThrough 774 775 0 86.7 11.5 1.0X
+RunLengthEncoding 1244 1255 16 54.0 18.5 0.6X
+DictionaryEncoding 733 733 0 91.6 10.9 1.1X
+LongDelta 543 543 0 123.6 8.1 1.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Encode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 13 13 0 5021.1 0.2 1.0X
-RunLengthEncoding(0.999) 1087 1090 4 61.7 16.2 0.0X
-DictionaryEncoding(0.251) 409 410 2 164.0 6.1 0.0X
-LongDelta(0.125) 111 112 1 603.0 1.7 0.1X
+PassThrough(1.000) 18 18 0 3753.2 0.3 1.0X
+RunLengthEncoding(1.000) 1103 1104 1 60.8 16.4 0.0X
+DictionaryEncoding(0.251) 426 426 0 157.6 6.3 0.0X
+LongDelta(0.125) 133 134 0 503.1 2.0 0.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Decode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 816 817 2 82.3 12.2 1.0X
-RunLengthEncoding 1235 1236 1 54.4 18.4 0.7X
-DictionaryEncoding 811 812 2 82.8 12.1 1.0X
-LongDelta 671 674 3 100.0 10.0 1.2X
+PassThrough 774 775 1 86.7 11.5 1.0X
+RunLengthEncoding 1242 1243 1 54.0 18.5 0.6X
+DictionaryEncoding 734 735 1 91.4 10.9 1.1X
+LongDelta 671 671 0 100.0 10.0 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
STRING Encode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 26 29 1 2629.0 0.4 1.0X
-RunLengthEncoding(0.889) 2060 2063 6 32.6 30.7 0.0X
-DictionaryEncoding(0.167) 2176 2179 5 30.8 32.4 0.0X
+PassThrough(1.000) 20 20 0 3349.9 0.3 1.0X
+RunLengthEncoding(0.894) 2062 2062 0 32.5 30.7 0.0X
+DictionaryEncoding(0.167) 2312 2317 8 29.0 34.4 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
STRING Decode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 1650 1670 28 40.7 24.6 1.0X
-RunLengthEncoding 2510 2512 3 26.7 37.4 0.7X
-DictionaryEncoding 1990 1998 12 33.7 29.6 0.8X
+PassThrough 1632 1654 31 41.1 24.3 1.0X
+RunLengthEncoding 2508 2510 2 26.8 37.4 0.7X
+DictionaryEncoding 2009 2011 2 33.4 29.9 0.8X
diff --git a/sql/core/benchmarks/CompressionSchemeBenchmark-results.txt b/sql/core/benchmarks/CompressionSchemeBenchmark-results.txt
index 0e846555ef114..644366d42a968 100644
--- a/sql/core/benchmarks/CompressionSchemeBenchmark-results.txt
+++ b/sql/core/benchmarks/CompressionSchemeBenchmark-results.txt
@@ -2,136 +2,136 @@
Compression Scheme Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
BOOLEAN Encode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 1 1 0 49097.6 0.0 1.0X
-RunLengthEncoding(2.503) 887 892 5 75.6 13.2 0.0X
-BooleanBitSet(0.125) 297 297 0 226.1 4.4 0.0X
+PassThrough(1.000) 1 1 0 49126.6 0.0 1.0X
+RunLengthEncoding(2.503) 886 888 2 75.8 13.2 0.0X
+BooleanBitSet(0.125) 293 294 1 228.8 4.4 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
BOOLEAN Decode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 168 168 0 400.3 2.5 1.0X
-RunLengthEncoding 554 554 1 121.2 8.3 0.3X
-BooleanBitSet 652 657 4 102.9 9.7 0.3X
+PassThrough 168 168 0 399.9 2.5 1.0X
+RunLengthEncoding 540 541 1 124.3 8.0 0.3X
+BooleanBitSet 655 659 4 102.5 9.8 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Encode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 3 3 0 24577.6 0.0 1.0X
-RunLengthEncoding(1.494) 998 1000 3 67.3 14.9 0.0X
+PassThrough(1.000) 3 3 0 23278.0 0.0 1.0X
+RunLengthEncoding(1.499) 1038 1039 1 64.7 15.5 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Decode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 689 691 2 97.4 10.3 1.0X
-RunLengthEncoding 969 970 2 69.3 14.4 0.7X
+PassThrough 543 544 1 123.5 8.1 1.0X
+RunLengthEncoding 963 964 1 69.7 14.4 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Encode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 3 3 0 22331.2 0.0 1.0X
-RunLengthEncoding(2.005) 1008 1008 0 66.6 15.0 0.0X
+PassThrough(1.000) 3 3 0 23167.5 0.0 1.0X
+RunLengthEncoding(2.010) 1059 1061 3 63.4 15.8 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SHORT Decode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 689 691 2 97.4 10.3 1.0X
-RunLengthEncoding 927 928 1 72.4 13.8 0.7X
+PassThrough 544 544 0 123.4 8.1 1.0X
+RunLengthEncoding 908 909 2 73.9 13.5 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Encode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 6 6 0 11223.2 0.1 1.0X
-RunLengthEncoding(1.000) 958 959 1 70.0 14.3 0.0X
-DictionaryEncoding(0.500) 370 371 2 181.5 5.5 0.0X
-IntDelta(0.250) 110 110 1 609.9 1.6 0.1X
+PassThrough(1.000) 6 6 0 11254.0 0.1 1.0X
+RunLengthEncoding(1.006) 990 991 1 67.8 14.8 0.0X
+DictionaryEncoding(0.500) 384 385 0 174.6 5.7 0.0X
+IntDelta(0.250) 115 115 0 582.0 1.7 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Decode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 626 629 2 107.1 9.3 1.0X
-RunLengthEncoding 1051 1052 0 63.8 15.7 0.6X
-DictionaryEncoding 523 524 2 128.3 7.8 1.2X
-IntDelta 459 460 1 146.1 6.8 1.4X
+PassThrough 627 627 0 107.1 9.3 1.0X
+RunLengthEncoding 1177 1177 0 57.0 17.5 0.5X
+DictionaryEncoding 523 524 2 128.4 7.8 1.2X
+IntDelta 459 459 0 146.2 6.8 1.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Encode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 6 6 0 11176.2 0.1 1.0X
-RunLengthEncoding(1.333) 975 977 2 68.8 14.5 0.0X
-DictionaryEncoding(0.501) 369 371 2 181.8 5.5 0.0X
-IntDelta(0.250) 110 110 1 609.1 1.6 0.1X
+PassThrough(1.000) 6 6 0 11285.5 0.1 1.0X
+RunLengthEncoding(1.339) 1009 1009 0 66.5 15.0 0.0X
+DictionaryEncoding(0.501) 386 386 1 174.0 5.7 0.0X
+IntDelta(0.250) 115 115 0 581.8 1.7 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
INT Decode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
PassThrough 710 712 2 94.5 10.6 1.0X
-RunLengthEncoding 1157 1159 3 58.0 17.2 0.6X
-DictionaryEncoding 544 570 50 123.3 8.1 1.3X
-IntDelta 598 599 1 112.2 8.9 1.2X
+RunLengthEncoding 1111 1111 0 60.4 16.6 0.6X
+DictionaryEncoding 542 548 7 123.8 8.1 1.3X
+IntDelta 595 596 1 112.7 8.9 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Encode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 13 18 1 5006.5 0.2 1.0X
-RunLengthEncoding(0.757) 1008 1008 1 66.6 15.0 0.0X
-DictionaryEncoding(0.250) 433 434 0 154.9 6.5 0.0X
-LongDelta(0.125) 116 116 1 580.0 1.7 0.1X
+PassThrough(1.000) 13 13 0 5021.3 0.2 1.0X
+RunLengthEncoding(0.751) 1045 1046 0 64.2 15.6 0.0X
+DictionaryEncoding(0.250) 456 461 12 147.2 6.8 0.0X
+LongDelta(0.125) 111 111 0 605.7 1.7 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Decode (Lower Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 782 785 3 85.8 11.7 1.0X
-RunLengthEncoding 1187 1188 2 56.5 17.7 0.7X
-DictionaryEncoding 714 716 2 94.0 10.6 1.1X
-LongDelta 506 506 0 132.6 7.5 1.5X
+PassThrough 712 712 0 94.3 10.6 1.0X
+RunLengthEncoding 1169 1169 1 57.4 17.4 0.6X
+DictionaryEncoding 710 710 0 94.5 10.6 1.0X
+LongDelta 522 522 0 128.5 7.8 1.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Encode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 14 15 2 4970.3 0.2 1.0X
-RunLengthEncoding(1.003) 1009 1010 1 66.5 15.0 0.0X
-DictionaryEncoding(0.251) 435 436 2 154.3 6.5 0.0X
-LongDelta(0.125) 116 116 1 579.1 1.7 0.1X
+PassThrough(1.000) 13 14 0 5032.9 0.2 1.0X
+RunLengthEncoding(0.999) 1064 1065 0 63.0 15.9 0.0X
+DictionaryEncoding(0.251) 452 453 1 148.3 6.7 0.0X
+LongDelta(0.125) 111 111 0 603.9 1.7 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LONG Decode (Higher Skew): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 781 782 1 85.9 11.6 1.0X
-RunLengthEncoding 1195 1197 4 56.2 17.8 0.7X
-DictionaryEncoding 715 716 2 93.9 10.6 1.1X
-LongDelta 634 635 2 105.9 9.4 1.2X
+PassThrough 713 714 0 94.1 10.6 1.0X
+RunLengthEncoding 1175 1177 3 57.1 17.5 0.6X
+DictionaryEncoding 687 688 1 97.7 10.2 1.0X
+LongDelta 611 612 1 109.8 9.1 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
STRING Encode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough(1.000) 26 27 0 2611.3 0.4 1.0X
-RunLengthEncoding(0.892) 2003 2003 0 33.5 29.8 0.0X
-DictionaryEncoding(0.167) 2471 2472 2 27.2 36.8 0.0X
+PassThrough(1.000) 25 29 1 2732.0 0.4 1.0X
+RunLengthEncoding(0.895) 1991 1991 0 33.7 29.7 0.0X
+DictionaryEncoding(0.167) 1965 1966 2 34.2 29.3 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
STRING Decode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-PassThrough 1447 1472 35 46.4 21.6 1.0X
-RunLengthEncoding 2274 2275 1 29.5 33.9 0.6X
-DictionaryEncoding 2100 2100 1 32.0 31.3 0.7X
+PassThrough 1603 1604 2 41.9 23.9 1.0X
+RunLengthEncoding 2452 2453 1 27.4 36.5 0.7X
+DictionaryEncoding 2090 2090 0 32.1 31.1 0.8X
diff --git a/sql/core/benchmarks/ConstantColumnVectorBenchmark-jdk21-results.txt b/sql/core/benchmarks/ConstantColumnVectorBenchmark-jdk21-results.txt
index 873f19d3fff43..ef3b3ef806417 100644
--- a/sql/core/benchmarks/ConstantColumnVectorBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ConstantColumnVectorBenchmark-jdk21-results.txt
@@ -1,280 +1,280 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 403153.6 0.0 1.0X
-OnHeapColumnVector 2682 2693 16 152.7 6.5 0.0X
-OffHeapColumnVector 3740 3741 1 109.5 9.1 0.0X
+ConstantColumnVector 1 1 0 394213.8 0.0 1.0X
+OnHeapColumnVector 2886 2891 7 141.9 7.0 0.0X
+OffHeapColumnVector 5302 5304 2 77.3 12.9 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 458928.9 0.0 1.0X
-OnHeapColumnVector 4029 4031 4 101.7 9.8 0.0X
-OffHeapColumnVector 4613 4614 1 88.8 11.3 0.0X
+ConstantColumnVector 1 1 0 422517.2 0.0 1.0X
+OnHeapColumnVector 4022 4022 1 101.8 9.8 0.0X
+OffHeapColumnVector 4704 4706 3 87.1 11.5 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 458451.7 0.0 1.0X
-OnHeapColumnVector 4208 4211 4 97.3 10.3 0.0X
-OffHeapColumnVector 4774 4774 0 85.8 11.7 0.0X
+ConstantColumnVector 1 1 0 422455.8 0.0 1.0X
+OnHeapColumnVector 4232 4255 32 96.8 10.3 0.0X
+OffHeapColumnVector 5072 5074 2 80.8 12.4 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 15: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 458729.0 0.0 1.0X
-OnHeapColumnVector 4053 4053 0 101.1 9.9 0.0X
-OffHeapColumnVector 4629 4635 10 88.5 11.3 0.0X
+ConstantColumnVector 1 1 0 422731.3 0.0 1.0X
+OnHeapColumnVector 4260 4273 20 96.2 10.4 0.0X
+OffHeapColumnVector 4725 4735 14 86.7 11.5 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 459972.5 0.0 1.0X
-OnHeapColumnVector 3920 3933 18 104.5 9.6 0.0X
-OffHeapColumnVector 4652 4656 5 88.0 11.4 0.0X
+ConstantColumnVector 1 1 0 422774.9 0.0 1.0X
+OnHeapColumnVector 4526 4526 0 90.5 11.0 0.0X
+OffHeapColumnVector 5028 5030 2 81.5 12.3 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 30: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 458806.5 0.0 1.0X
-OnHeapColumnVector 4289 4289 0 95.5 10.5 0.0X
-OffHeapColumnVector 4958 4960 3 82.6 12.1 0.0X
+ConstantColumnVector 1 1 0 422525.9 0.0 1.0X
+OnHeapColumnVector 4698 4700 3 87.2 11.5 0.0X
+OffHeapColumnVector 5213 5215 4 78.6 12.7 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 720559.7 0.0 1.0X
-OnHeapColumnVector 15 15 0 27615.9 0.0 0.0X
-OffHeapColumnVector 61 62 1 6721.8 0.1 0.0X
+ConstantColumnVector 1 1 0 664352.7 0.0 1.0X
+OnHeapColumnVector 16 16 0 25464.2 0.0 0.0X
+OffHeapColumnVector 65 65 0 6277.8 0.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 655063.4 0.0 1.0X
-OnHeapColumnVector 30 31 1 13471.6 0.1 0.0X
-OffHeapColumnVector 61 62 2 6691.9 0.1 0.0X
+ConstantColumnVector 1 1 0 632716.8 0.0 1.0X
+OnHeapColumnVector 33 33 0 12471.3 0.1 0.0X
+OffHeapColumnVector 67 67 0 6156.8 0.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 496475.8 0.0 1.0X
-OnHeapColumnVector 15 15 0 27289.6 0.0 0.1X
-OffHeapColumnVector 118 119 1 3470.7 0.3 0.0X
+ConstantColumnVector 1 1 0 457741.1 0.0 1.0X
+OnHeapColumnVector 16 16 0 25377.8 0.0 0.1X
+OffHeapColumnVector 128 128 0 3210.0 0.3 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 553741.0 0.0 1.0X
-OnHeapColumnVector 31 32 1 13108.1 0.1 0.0X
-OffHeapColumnVector 119 120 1 3454.9 0.3 0.0X
+ConstantColumnVector 1 1 0 366593.5 0.0 1.0X
+OnHeapColumnVector 33 33 0 12450.1 0.1 0.0X
+OffHeapColumnVector 129 130 0 3164.6 0.3 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 14401237.6 0.0 1.0X
-OnHeapColumnVector 100 102 1 4086.1 0.2 0.0X
-OffHeapColumnVector 4198 4227 41 97.6 10.3 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 106 106 0 3881.1 0.3 0.0X
+OffHeapColumnVector 3773 3773 1 108.6 9.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 14401237.6 0.0 1.0X
-OnHeapColumnVector 3811 3832 30 107.5 9.3 0.0X
-OffHeapColumnVector 4210 4215 6 97.3 10.3 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4106 4112 10 99.8 10.0 0.0X
+OffHeapColumnVector 3778 3788 14 108.4 9.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 14401237.6 0.0 1.0X
-OnHeapColumnVector 3810 3820 14 107.5 9.3 0.0X
-OffHeapColumnVector 4138 4197 83 99.0 10.1 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4100 4101 2 99.9 10.0 0.0X
+OffHeapColumnVector 3780 3791 15 108.4 9.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 15: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 14401237.6 0.0 1.0X
-OnHeapColumnVector 3801 3831 42 107.8 9.3 0.0X
-OffHeapColumnVector 4196 4200 6 97.6 10.2 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4099 4103 5 99.9 10.0 0.0X
+OffHeapColumnVector 3758 3759 0 109.0 9.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 14401237.6 0.0 1.0X
-OnHeapColumnVector 3810 3824 20 107.5 9.3 0.0X
-OffHeapColumnVector 4163 4165 2 98.4 10.2 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4096 4097 2 100.0 10.0 0.0X
+OffHeapColumnVector 3752 3754 2 109.2 9.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 30: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 14401237.6 0.0 1.0X
-OnHeapColumnVector 3789 3794 8 108.1 9.2 0.0X
-OffHeapColumnVector 4180 4203 33 98.0 10.2 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4088 4089 1 100.2 10.0 0.0X
+OffHeapColumnVector 3751 3754 5 109.2 9.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 3602747.8 0.0 1.0X
-OnHeapColumnVector 1 1 0 554206.3 0.0 0.2X
-OffHeapColumnVector 828 829 1 494.8 2.0 0.0X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 1 1 0 510968.5 0.0 0.0X
+OffHeapColumnVector 893 893 0 458.6 2.2 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1723 1731 12 237.8 4.2 1.0X
-OnHeapColumnVector 1972 1974 3 207.7 4.8 0.9X
-OffHeapColumnVector 2497 2517 29 164.0 6.1 0.7X
+ConstantColumnVector 1831 1832 0 223.7 4.5 1.0X
+OnHeapColumnVector 2087 2087 0 196.3 5.1 0.9X
+OffHeapColumnVector 2609 2609 1 157.0 6.4 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1741 1746 7 235.3 4.3 1.0X
-OnHeapColumnVector 1998 2009 16 205.0 4.9 0.9X
-OffHeapColumnVector 2598 2598 1 157.7 6.3 0.7X
+ConstantColumnVector 1854 1855 1 220.9 4.5 1.0X
+OnHeapColumnVector 2110 2110 0 194.1 5.2 0.9X
+OffHeapColumnVector 2623 2632 13 156.2 6.4 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1886 1890 6 217.2 4.6 1.0X
-OnHeapColumnVector 1994 1999 8 205.4 4.9 0.9X
-OffHeapColumnVector 2582 2594 17 158.6 6.3 0.7X
+ConstantColumnVector 1991 1991 1 205.8 4.9 1.0X
+OnHeapColumnVector 2143 2146 5 191.2 5.2 0.9X
+OffHeapColumnVector 2764 2765 1 148.2 6.7 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2352 2367 21 174.2 5.7 1.0X
-OnHeapColumnVector 5306 5327 30 77.2 13.0 0.4X
-OffHeapColumnVector 5835 5836 2 70.2 14.2 0.4X
+ConstantColumnVector 1953 1953 0 209.8 4.8 1.0X
+OnHeapColumnVector 5871 5914 61 69.8 14.3 0.3X
+OffHeapColumnVector 5194 5198 6 78.9 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2348 2350 2 174.4 5.7 1.0X
-OnHeapColumnVector 5374 5387 18 76.2 13.1 0.4X
-OffHeapColumnVector 5940 5990 71 69.0 14.5 0.4X
+ConstantColumnVector 1952 1953 2 209.9 4.8 1.0X
+OnHeapColumnVector 5843 5843 1 70.1 14.3 0.3X
+OffHeapColumnVector 5217 5218 2 78.5 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2335 2350 21 175.4 5.7 1.0X
-OnHeapColumnVector 5323 5370 66 77.0 13.0 0.4X
-OffHeapColumnVector 5828 5835 10 70.3 14.2 0.4X
+ConstantColumnVector 1954 1955 2 209.6 4.8 1.0X
+OnHeapColumnVector 5850 5851 1 70.0 14.3 0.3X
+OffHeapColumnVector 5215 5216 1 78.5 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 15: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2323 2332 13 176.3 5.7 1.0X
-OnHeapColumnVector 5271 5305 48 77.7 12.9 0.4X
-OffHeapColumnVector 5856 5861 7 69.9 14.3 0.4X
+ConstantColumnVector 1951 1952 2 210.0 4.8 1.0X
+OnHeapColumnVector 5848 5849 1 70.0 14.3 0.3X
+OffHeapColumnVector 5217 5219 2 78.5 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2323 2327 6 176.3 5.7 1.0X
-OnHeapColumnVector 5313 5318 8 77.1 13.0 0.4X
-OffHeapColumnVector 5814 5821 10 70.4 14.2 0.4X
+ConstantColumnVector 1952 1952 0 209.8 4.8 1.0X
+OnHeapColumnVector 5867 5869 2 69.8 14.3 0.3X
+OffHeapColumnVector 5198 5200 2 78.8 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 30: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2315 2326 15 176.9 5.7 1.0X
-OnHeapColumnVector 5274 5281 10 77.7 12.9 0.4X
-OffHeapColumnVector 5834 5857 33 70.2 14.2 0.4X
+ConstantColumnVector 1968 1969 2 208.1 4.8 1.0X
+OnHeapColumnVector 5847 5861 21 70.1 14.3 0.3X
+OffHeapColumnVector 5202 5206 5 78.7 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 708 711 2 578.4 1.7 1.0X
-OnHeapColumnVector 827 829 3 495.2 2.0 0.9X
-OffHeapColumnVector 827 833 7 495.0 2.0 0.9X
+ConstantColumnVector 893 893 1 458.9 2.2 1.0X
+OnHeapColumnVector 1020 1022 2 401.6 2.5 0.9X
+OffHeapColumnVector 893 893 1 458.9 2.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2707 2710 4 151.3 6.6 1.0X
-OnHeapColumnVector 2801 2815 20 146.2 6.8 1.0X
-OffHeapColumnVector 2832 2839 11 144.7 6.9 1.0X
+ConstantColumnVector 2871 2872 1 142.7 7.0 1.0X
+OnHeapColumnVector 2994 2995 1 136.8 7.3 1.0X
+OffHeapColumnVector 2999 3013 20 136.6 7.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2220 2231 15 184.5 5.4 1.0X
-OnHeapColumnVector 2972 2995 32 137.8 7.3 0.7X
-OffHeapColumnVector 2971 2974 3 137.8 7.3 0.7X
+ConstantColumnVector 2884 2885 2 142.0 7.0 1.0X
+OnHeapColumnVector 3040 3041 1 134.8 7.4 0.9X
+OffHeapColumnVector 3010 3010 1 136.1 7.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2836 2843 10 144.4 6.9 1.0X
-OnHeapColumnVector 2973 2995 30 137.8 7.3 1.0X
-OffHeapColumnVector 2948 2953 7 138.9 7.2 1.0X
+ConstantColumnVector 3024 3026 2 135.4 7.4 1.0X
+OnHeapColumnVector 3154 3155 1 129.9 7.7 1.0X
+OffHeapColumnVector 3150 3151 2 130.0 7.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with StringType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 439957035.4 0.0 1.0X
-OnHeapColumnVector 0 0 0 3602747.8 0.0 0.0X
-OffHeapColumnVector 0 0 0 439957035.4 0.0 1.0X
+ConstantColumnVector 0 0 0 405143422.4 0.0 1.0X
+OnHeapColumnVector 0 0 0 3321467.1 0.0 0.0X
+OffHeapColumnVector 0 0 0 405143422.4 0.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 439957035.4 0.0 1.0X
-OnHeapColumnVector 0 0 0 3602747.8 0.0 0.0X
-OffHeapColumnVector 0 0 0 439957035.4 0.0 1.0X
+ConstantColumnVector 0 0 0 405143422.4 0.0 1.0X
+OnHeapColumnVector 0 0 0 3321467.1 0.0 0.0X
+OffHeapColumnVector 0 0 0 405143422.4 0.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 439957035.4 0.0 1.0X
-OnHeapColumnVector 0 0 0 3602747.8 0.0 0.0X
-OffHeapColumnVector 0 0 0 439957035.4 0.0 1.0X
+ConstantColumnVector 0 0 0 405143422.4 0.0 1.0X
+OnHeapColumnVector 0 0 0 3321467.1 0.0 0.0X
+OffHeapColumnVector 0 0 0 405143422.4 0.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 439957035.4 0.0 1.0X
-OnHeapColumnVector 0 0 0 3602747.8 0.0 0.0X
-OffHeapColumnVector 0 0 0 439957035.4 0.0 1.0X
+ConstantColumnVector 0 0 0 405143422.4 0.0 1.0X
+OnHeapColumnVector 0 0 0 3321467.1 0.0 0.0X
+OffHeapColumnVector 0 0 0 405143422.4 0.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 439957035.4 0.0 1.0X
-OnHeapColumnVector 0 0 0 3602747.8 0.0 0.0X
-OffHeapColumnVector 0 0 0 439957035.4 0.0 1.0X
+ConstantColumnVector 0 0 0 405143422.4 0.0 1.0X
+OnHeapColumnVector 0 0 0 3321467.1 0.0 0.0X
+OffHeapColumnVector 0 0 0 405143422.4 0.0 1.0X
diff --git a/sql/core/benchmarks/ConstantColumnVectorBenchmark-results.txt b/sql/core/benchmarks/ConstantColumnVectorBenchmark-results.txt
index c7c6f7d6f5fee..9d1a8cbbaaac7 100644
--- a/sql/core/benchmarks/ConstantColumnVectorBenchmark-results.txt
+++ b/sql/core/benchmarks/ConstantColumnVectorBenchmark-results.txt
@@ -1,280 +1,280 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 325448.5 0.0 1.0X
-OnHeapColumnVector 2823 2826 4 145.1 6.9 0.0X
-OffHeapColumnVector 3497 3499 3 117.1 8.5 0.0X
+ConstantColumnVector 1 1 0 326662.9 0.0 1.0X
+OnHeapColumnVector 2826 2830 5 144.9 6.9 0.0X
+OffHeapColumnVector 3311 3319 12 123.7 8.1 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 383288.8 0.0 1.0X
-OnHeapColumnVector 3660 3661 2 111.9 8.9 0.0X
-OffHeapColumnVector 4384 4387 4 93.4 10.7 0.0X
+ConstantColumnVector 1 1 0 383970.7 0.0 1.0X
+OnHeapColumnVector 3676 3694 25 111.4 9.0 0.0X
+OffHeapColumnVector 4324 4326 3 94.7 10.6 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 383417.9 0.0 1.0X
-OnHeapColumnVector 3845 3846 1 106.5 9.4 0.0X
-OffHeapColumnVector 4622 4624 2 88.6 11.3 0.0X
+ConstantColumnVector 1 1 0 383962.4 0.0 1.0X
+OnHeapColumnVector 3742 3742 1 109.5 9.1 0.0X
+OffHeapColumnVector 4315 4320 8 94.9 10.5 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 15: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 383417.6 0.0 1.0X
-OnHeapColumnVector 3682 3685 3 111.2 9.0 0.0X
-OffHeapColumnVector 4408 4424 23 92.9 10.8 0.0X
+ConstantColumnVector 1 1 0 384110.8 0.0 1.0X
+OnHeapColumnVector 3914 3914 0 104.7 9.6 0.0X
+OffHeapColumnVector 4335 4339 6 94.5 10.6 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 383346.2 0.0 1.0X
-OnHeapColumnVector 4120 4120 1 99.4 10.1 0.0X
-OffHeapColumnVector 4573 4573 0 89.6 11.2 0.0X
+ConstantColumnVector 1 1 0 384114.0 0.0 1.0X
+OnHeapColumnVector 3759 3759 0 109.0 9.2 0.0X
+OffHeapColumnVector 4346 4348 4 94.3 10.6 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with StringType, row length = 30: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 383533.2 0.0 1.0X
-OnHeapColumnVector 4446 4460 20 92.1 10.9 0.0X
-OffHeapColumnVector 4740 4746 9 86.4 11.6 0.0X
+ConstantColumnVector 1 1 0 384121.2 0.0 1.0X
+OnHeapColumnVector 3820 3828 11 107.2 9.3 0.0X
+OffHeapColumnVector 4250 4252 3 96.4 10.4 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 699318.6 0.0 1.0X
-OnHeapColumnVector 16 16 0 25434.3 0.0 0.0X
-OffHeapColumnVector 65 66 0 6261.4 0.2 0.0X
+ConstantColumnVector 1 1 0 699312.6 0.0 1.0X
+OnHeapColumnVector 16 16 0 25439.2 0.0 0.0X
+OffHeapColumnVector 65 65 0 6290.8 0.2 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 664349.4 0.0 1.0X
-OnHeapColumnVector 34 34 0 12170.8 0.1 0.0X
-OffHeapColumnVector 67 67 0 6157.8 0.2 0.0X
+ConstantColumnVector 1 1 0 664346.2 0.0 1.0X
+OnHeapColumnVector 33 34 0 12270.8 0.1 0.0X
+OffHeapColumnVector 66 66 0 6202.4 0.2 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 553055.4 0.0 1.0X
-OnHeapColumnVector 16 16 0 25045.2 0.0 0.0X
-OffHeapColumnVector 128 128 0 3202.8 0.3 0.0X
+ConstantColumnVector 1 1 0 553051.6 0.0 1.0X
+OnHeapColumnVector 16 16 0 25077.4 0.0 0.0X
+OffHeapColumnVector 128 128 0 3197.1 0.3 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 1 1 0 510539.9 0.0 1.0X
-OnHeapColumnVector 35 35 0 11831.2 0.1 0.0X
-OffHeapColumnVector 129 130 0 3171.6 0.3 0.0X
+ConstantColumnVector 1 1 0 510536.0 0.0 1.0X
+OnHeapColumnVector 34 35 0 11916.5 0.1 0.0X
+OffHeapColumnVector 129 129 0 3175.9 0.3 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 684 687 3 598.9 1.7 1.0X
-OnHeapColumnVector 1801 1801 1 227.5 4.4 0.4X
-OffHeapColumnVector 4435 4437 3 92.4 10.8 0.2X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 98 99 0 4159.9 0.2 0.0X
+OffHeapColumnVector 3722 3724 3 110.0 9.1 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 939 947 14 436.3 2.3 1.0X
-OnHeapColumnVector 4945 4946 2 82.8 12.1 0.2X
-OffHeapColumnVector 4579 4580 1 89.5 11.2 0.2X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4109 4115 9 99.7 10.0 0.0X
+OffHeapColumnVector 3686 3695 12 111.1 9.0 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 942 944 2 434.9 2.3 1.0X
-OnHeapColumnVector 5119 5121 3 80.0 12.5 0.2X
-OffHeapColumnVector 4486 4489 3 91.3 11.0 0.2X
+ConstantColumnVector 0 0 0 13278008.3 0.0 1.0X
+OnHeapColumnVector 4114 4115 0 99.6 10.0 0.0X
+OffHeapColumnVector 3700 3709 12 110.7 9.0 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 15: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 937 939 2 437.0 2.3 1.0X
-OnHeapColumnVector 5118 5119 2 80.0 12.5 0.2X
-OffHeapColumnVector 4492 4495 3 91.2 11.0 0.2X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4127 4131 5 99.3 10.1 0.0X
+OffHeapColumnVector 3693 3699 9 110.9 9.0 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 941 942 1 435.1 2.3 1.0X
-OnHeapColumnVector 5111 5122 15 80.1 12.5 0.2X
-OffHeapColumnVector 4484 4488 6 91.3 10.9 0.2X
+ConstantColumnVector 0 0 0 13274135.5 0.0 1.0X
+OnHeapColumnVector 4117 4127 14 99.5 10.1 0.0X
+OffHeapColumnVector 3680 3685 7 111.3 9.0 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with StringType, row length = 30: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 938 939 1 436.8 2.3 1.0X
-OnHeapColumnVector 5116 5119 5 80.1 12.5 0.2X
-OffHeapColumnVector 4582 4584 4 89.4 11.2 0.2X
+ConstantColumnVector 0 0 0 13278438.7 0.0 1.0X
+OnHeapColumnVector 4125 4136 15 99.3 10.1 0.0X
+OffHeapColumnVector 3691 3697 9 111.0 9.0 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2595 2597 2 157.8 6.3 1.0X
-OnHeapColumnVector 2720 2720 1 150.6 6.6 1.0X
-OffHeapColumnVector 2600 2602 2 157.5 6.3 1.0X
+ConstantColumnVector 2472 2472 1 165.7 6.0 1.0X
+OnHeapColumnVector 2600 2601 1 157.5 6.3 1.0X
+OffHeapColumnVector 2482 2483 0 165.0 6.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 1476318.0 0.0 1.0X
-OnHeapColumnVector 0 0 0 949059.9 0.0 0.6X
-OffHeapColumnVector 767 768 1 533.9 1.9 0.0X
+ConstantColumnVector 0 0 0 1660841.3 0.0 1.0X
+OnHeapColumnVector 1 1 0 474470.6 0.0 0.3X
+OffHeapColumnVector 767 768 1 534.1 1.9 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 1476318.0 0.0 1.0X
-OnHeapColumnVector 0 0 0 1022063.2 0.0 0.7X
-OffHeapColumnVector 767 767 0 534.0 1.9 0.0X
+ConstantColumnVector 0 0 0 1660848.0 0.0 1.0X
+OnHeapColumnVector 0 0 0 1022058.1 0.0 0.6X
+OffHeapColumnVector 767 773 5 533.8 1.9 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test read with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 1476318.0 0.0 1.0X
-OnHeapColumnVector 0 1 0 885790.2 0.0 0.6X
-OffHeapColumnVector 696 696 0 588.9 1.7 0.0X
+ConstantColumnVector 0 0 0 1476307.4 0.0 1.0X
+OnHeapColumnVector 1 1 0 459321.6 0.0 0.3X
+OffHeapColumnVector 893 893 0 458.7 2.2 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 1: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 1021805.7 0.0 1.0X
-OnHeapColumnVector 3895 3903 12 105.2 9.5 0.0X
-OffHeapColumnVector 3725 3734 13 110.0 9.1 0.0X
+ConstantColumnVector 0 0 0 948833.4 0.0 1.0X
+OnHeapColumnVector 3903 3908 7 104.9 9.5 0.0X
+OffHeapColumnVector 3765 3769 6 108.8 9.2 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 5: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 830408.9 0.0 1.0X
-OnHeapColumnVector 3894 3907 17 105.2 9.5 0.0X
-OffHeapColumnVector 3714 3721 10 110.3 9.1 0.0X
+ConstantColumnVector 0 0 0 830400.4 0.0 1.0X
+OnHeapColumnVector 3900 3904 6 105.0 9.5 0.0X
+OffHeapColumnVector 3731 3746 21 109.8 9.1 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 10: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 830392.0 0.0 1.0X
-OnHeapColumnVector 3895 3896 2 105.2 9.5 0.0X
-OffHeapColumnVector 3723 3723 0 110.0 9.1 0.0X
+ConstantColumnVector 0 0 0 830403.8 0.0 1.0X
+OnHeapColumnVector 3904 3912 11 104.9 9.5 0.0X
+OffHeapColumnVector 3749 3759 14 109.3 9.2 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 15: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 830388.7 0.0 1.0X
-OnHeapColumnVector 3890 3896 8 105.3 9.5 0.0X
-OffHeapColumnVector 3763 3764 1 108.8 9.2 0.0X
+ConstantColumnVector 0 0 0 830403.8 0.0 1.0X
+OnHeapColumnVector 3899 3899 0 105.1 9.5 0.0X
+OffHeapColumnVector 3728 3731 4 109.9 9.1 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 20: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
ConstantColumnVector 0 0 0 830403.8 0.0 1.0X
-OnHeapColumnVector 3882 3886 6 105.5 9.5 0.0X
-OffHeapColumnVector 3697 3699 3 110.8 9.0 0.0X
+OnHeapColumnVector 3900 3907 10 105.0 9.5 0.0X
+OffHeapColumnVector 3731 3766 49 109.8 9.1 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with StringType, row length = 30: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 830407.2 0.0 1.0X
-OnHeapColumnVector 3887 3891 5 105.4 9.5 0.0X
-OffHeapColumnVector 3700 3701 1 110.7 9.0 0.0X
+ConstantColumnVector 0 1 0 830403.8 0.0 1.0X
+OnHeapColumnVector 3905 3911 9 104.9 9.5 0.0X
+OffHeapColumnVector 3725 3726 1 109.9 9.1 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 2967 2968 2 138.1 7.2 1.0X
-OnHeapColumnVector 2714 2716 3 150.9 6.6 1.1X
-OffHeapColumnVector 2714 2715 2 150.9 6.6 1.1X
+ConstantColumnVector 2847 2858 16 143.9 7.0 1.0X
+OnHeapColumnVector 2607 2609 2 157.1 6.4 1.1X
+OffHeapColumnVector 2496 2497 1 164.1 6.1 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 765 765 0 535.7 1.9 1.0X
-OnHeapColumnVector 893 894 2 458.6 2.2 0.9X
-OffHeapColumnVector 893 893 0 458.8 2.2 0.9X
+ConstantColumnVector 764 765 0 535.8 1.9 1.0X
+OnHeapColumnVector 894 894 1 458.4 2.2 0.9X
+OffHeapColumnVector 893 895 2 458.5 2.2 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 765 765 0 535.5 1.9 1.0X
-OnHeapColumnVector 767 767 1 534.3 1.9 1.0X
-OffHeapColumnVector 766 769 3 535.0 1.9 1.0X
+ConstantColumnVector 892 893 1 459.0 2.2 1.0X
+OnHeapColumnVector 766 767 0 534.5 1.9 1.2X
+OffHeapColumnVector 766 766 1 535.0 1.9 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test write and read with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 1898027.4 0.0 1.0X
-OnHeapColumnVector 656 657 3 624.5 1.6 0.0X
-OffHeapColumnVector 696 696 0 588.8 1.7 0.0X
+ConstantColumnVector 765 765 0 535.3 1.9 1.0X
+OnHeapColumnVector 893 895 2 458.5 2.2 0.9X
+OffHeapColumnVector 894 895 0 458.2 2.2 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with StringType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 409190809.2 0.0 1.0X
+ConstantColumnVector 0 0 0 209728622.6 0.0 1.0X
OnHeapColumnVector 0 0 0 2212069.2 0.0 0.0X
-OffHeapColumnVector 0 0 0 409190809.2 0.0 1.0X
+OffHeapColumnVector 0 0 0 209728622.6 0.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with IntegerType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 409190809.2 0.0 1.0X
-OnHeapColumnVector 0 0 0 2211961.7 0.0 0.0X
-OffHeapColumnVector 0 0 0 409190809.2 0.0 1.0X
+ConstantColumnVector 0 0 0 209728622.6 0.0 1.0X
+OnHeapColumnVector 0 0 0 2212057.2 0.0 0.0X
+OffHeapColumnVector 0 0 0 209728622.6 0.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with LongType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 409190809.2 0.0 1.0X
-OnHeapColumnVector 0 0 0 2211961.7 0.0 0.0X
-OffHeapColumnVector 0 0 0 409190809.2 0.0 1.0X
+ConstantColumnVector 0 0 0 209728622.6 0.0 1.0X
+OnHeapColumnVector 0 0 0 2212069.2 0.0 0.0X
+OffHeapColumnVector 0 0 0 209728622.6 0.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with FloatType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 409190809.2 0.0 1.0X
-OnHeapColumnVector 0 0 0 2212057.2 0.0 0.0X
-OffHeapColumnVector 0 0 0 409190809.2 0.0 1.0X
+ConstantColumnVector 0 0 0 209728622.6 0.0 1.0X
+OnHeapColumnVector 0 0 0 2212069.2 0.0 0.0X
+OffHeapColumnVector 0 0 0 209728622.6 0.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Test isNull with DoubleType: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ConstantColumnVector 0 0 0 409190809.2 0.0 1.0X
-OnHeapColumnVector 0 0 0 2211949.7 0.0 0.0X
-OffHeapColumnVector 0 0 0 409190809.2 0.0 1.0X
+ConstantColumnVector 0 0 0 209728622.6 0.0 1.0X
+OnHeapColumnVector 0 0 0 2212057.2 0.0 0.0X
+OffHeapColumnVector 0 0 0 209728622.6 0.0 1.0X
diff --git a/sql/core/benchmarks/DataSourceReadBenchmark-jdk21-results.txt b/sql/core/benchmarks/DataSourceReadBenchmark-jdk21-results.txt
index b716c18deba73..be11d3a0d8b0e 100644
--- a/sql/core/benchmarks/DataSourceReadBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/DataSourceReadBenchmark-jdk21-results.txt
@@ -2,437 +2,437 @@
SQL Single Numeric Column Scan
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single BOOLEAN Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 9693 9747 77 1.6 616.2 1.0X
-SQL Json 7743 7871 181 2.0 492.3 1.3X
-SQL Json with UnsafeRow 8445 8509 90 1.9 536.9 1.1X
-SQL Parquet Vectorized: DataPageV1 107 118 7 147.3 6.8 90.7X
-SQL Parquet Vectorized: DataPageV2 125 132 4 126.2 7.9 77.8X
-SQL Parquet MR: DataPageV1 1743 1747 5 9.0 110.8 5.6X
-SQL Parquet MR: DataPageV2 1608 1608 0 9.8 102.2 6.0X
-SQL ORC Vectorized 139 152 18 113.5 8.8 70.0X
-SQL ORC MR 1452 1466 20 10.8 92.3 6.7X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 10016 10139 174 1.6 636.8 1.0X
+SQL Json 8116 8156 56 1.9 516.0 1.2X
+SQL Json with UnsafeRow 8940 8963 33 1.8 568.4 1.1X
+SQL Parquet Vectorized: DataPageV1 90 102 12 175.7 5.7 111.9X
+SQL Parquet Vectorized: DataPageV2 93 102 6 168.9 5.9 107.6X
+SQL Parquet MR: DataPageV1 1798 1838 56 8.7 114.3 5.6X
+SQL Parquet MR: DataPageV2 1674 1679 7 9.4 106.4 6.0X
+SQL ORC Vectorized 143 159 24 110.2 9.1 70.2X
+SQL ORC MR 1552 1562 15 10.1 98.6 6.5X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single BOOLEAN Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 94 95 2 167.7 6.0 1.0X
-ParquetReader Vectorized: DataPageV2 124 126 1 126.5 7.9 0.8X
-ParquetReader Vectorized -> Row: DataPageV1 75 76 2 211.1 4.7 1.3X
-ParquetReader Vectorized -> Row: DataPageV2 107 108 1 147.5 6.8 0.9X
+ParquetReader Vectorized: DataPageV1 94 96 2 166.9 6.0 1.0X
+ParquetReader Vectorized: DataPageV2 106 109 2 148.6 6.7 0.9X
+ParquetReader Vectorized -> Row: DataPageV1 76 78 2 207.7 4.8 1.2X
+ParquetReader Vectorized -> Row: DataPageV2 89 91 2 177.6 5.6 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single TINYINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 9054 9113 83 1.7 575.7 1.0X
-SQL Json 8690 8707 24 1.8 552.5 1.0X
-SQL Json with UnsafeRow 9308 9317 13 1.7 591.8 1.0X
-SQL Parquet Vectorized: DataPageV1 99 110 8 159.5 6.3 91.8X
-SQL Parquet Vectorized: DataPageV2 97 111 17 162.1 6.2 93.3X
-SQL Parquet MR: DataPageV1 1818 1820 3 8.7 115.6 5.0X
-SQL Parquet MR: DataPageV2 1864 1866 3 8.4 118.5 4.9X
-SQL ORC Vectorized 110 134 19 142.6 7.0 82.1X
-SQL ORC MR 1592 1600 10 9.9 101.2 5.7X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 9341 9372 44 1.7 593.9 1.0X
+SQL Json 8686 8757 100 1.8 552.2 1.1X
+SQL Json with UnsafeRow 9507 9517 13 1.7 604.5 1.0X
+SQL Parquet Vectorized: DataPageV1 150 158 6 104.5 9.6 62.1X
+SQL Parquet Vectorized: DataPageV2 149 156 7 105.5 9.5 62.7X
+SQL Parquet MR: DataPageV1 1959 1967 12 8.0 124.6 4.8X
+SQL Parquet MR: DataPageV2 1856 1880 34 8.5 118.0 5.0X
+SQL ORC Vectorized 141 150 12 111.5 9.0 66.2X
+SQL ORC MR 1669 1670 2 9.4 106.1 5.6X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single TINYINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 78 81 6 202.9 4.9 1.0X
-ParquetReader Vectorized: DataPageV2 79 81 1 199.7 5.0 1.0X
-ParquetReader Vectorized -> Row: DataPageV1 46 49 4 339.0 2.9 1.7X
-ParquetReader Vectorized -> Row: DataPageV2 46 50 4 339.3 2.9 1.7X
+ParquetReader Vectorized: DataPageV1 125 129 6 125.9 7.9 1.0X
+ParquetReader Vectorized: DataPageV2 124 128 3 126.8 7.9 1.0X
+ParquetReader Vectorized -> Row: DataPageV1 101 117 33 155.9 6.4 1.2X
+ParquetReader Vectorized -> Row: DataPageV2 101 103 2 156.1 6.4 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single SMALLINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 9898 9911 19 1.6 629.3 1.0X
-SQL Json 9233 9238 7 1.7 587.0 1.1X
-SQL Json with UnsafeRow 9788 9804 24 1.6 622.3 1.0X
-SQL Parquet Vectorized: DataPageV1 121 135 14 130.2 7.7 82.0X
-SQL Parquet Vectorized: DataPageV2 138 152 16 114.1 8.8 71.8X
-SQL Parquet MR: DataPageV1 2029 2035 7 7.8 129.0 4.9X
-SQL Parquet MR: DataPageV2 1949 1964 22 8.1 123.9 5.1X
-SQL ORC Vectorized 140 147 11 112.5 8.9 70.8X
-SQL ORC MR 1607 1619 16 9.8 102.2 6.2X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 10510 10522 17 1.5 668.2 1.0X
+SQL Json 9264 9265 2 1.7 589.0 1.1X
+SQL Json with UnsafeRow 9945 9947 3 1.6 632.3 1.1X
+SQL Parquet Vectorized: DataPageV1 123 140 13 127.5 7.8 85.2X
+SQL Parquet Vectorized: DataPageV2 142 171 24 110.6 9.0 73.9X
+SQL Parquet MR: DataPageV1 2103 2104 1 7.5 133.7 5.0X
+SQL Parquet MR: DataPageV2 2072 2075 4 7.6 131.7 5.1X
+SQL ORC Vectorized 147 162 19 107.2 9.3 71.6X
+SQL ORC MR 1769 1770 1 8.9 112.4 5.9X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single SMALLINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 149 164 11 105.3 9.5 1.0X
-ParquetReader Vectorized: DataPageV2 168 176 6 93.8 10.7 0.9X
-ParquetReader Vectorized -> Row: DataPageV1 145 153 10 108.3 9.2 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 165 176 8 95.3 10.5 0.9X
+ParquetReader Vectorized: DataPageV1 150 159 7 105.0 9.5 1.0X
+ParquetReader Vectorized: DataPageV2 196 203 5 80.2 12.5 0.8X
+ParquetReader Vectorized -> Row: DataPageV1 146 149 2 107.9 9.3 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 175 183 7 90.1 11.1 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single INT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 11119 11129 15 1.4 706.9 1.0X
-SQL Json 9483 9484 2 1.7 602.9 1.2X
-SQL Json with UnsafeRow 10139 10156 24 1.6 644.6 1.1X
-SQL Parquet Vectorized: DataPageV1 103 118 15 152.0 6.6 107.5X
-SQL Parquet Vectorized: DataPageV2 181 197 15 86.8 11.5 61.4X
-SQL Parquet MR: DataPageV1 1907 1930 32 8.2 121.3 5.8X
-SQL Parquet MR: DataPageV2 1942 1983 57 8.1 123.5 5.7X
-SQL ORC Vectorized 180 191 12 87.6 11.4 61.9X
-SQL ORC MR 1642 1642 0 9.6 104.4 6.8X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 11428 11428 1 1.4 726.6 1.0X
+SQL Json 9760 9761 2 1.6 620.5 1.2X
+SQL Json with UnsafeRow 10321 10322 0 1.5 656.2 1.1X
+SQL Parquet Vectorized: DataPageV1 104 126 20 150.7 6.6 109.5X
+SQL Parquet Vectorized: DataPageV2 189 209 21 83.2 12.0 60.4X
+SQL Parquet MR: DataPageV1 2071 2086 21 7.6 131.7 5.5X
+SQL Parquet MR: DataPageV2 2040 2061 30 7.7 129.7 5.6X
+SQL ORC Vectorized 188 205 17 83.7 12.0 60.8X
+SQL ORC MR 1807 1818 15 8.7 114.9 6.3X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single INT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 131 134 7 119.9 8.3 1.0X
-ParquetReader Vectorized: DataPageV2 210 215 7 74.9 13.4 0.6X
-ParquetReader Vectorized -> Row: DataPageV1 135 135 1 116.9 8.6 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 207 219 10 76.0 13.2 0.6X
+ParquetReader Vectorized: DataPageV1 146 159 9 107.6 9.3 1.0X
+ParquetReader Vectorized: DataPageV2 228 242 9 69.0 14.5 0.6X
+ParquetReader Vectorized -> Row: DataPageV1 135 148 12 116.6 8.6 1.1X
+ParquetReader Vectorized -> Row: DataPageV2 220 239 12 71.5 14.0 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single BIGINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 11093 11109 23 1.4 705.3 1.0X
-SQL Json 9583 9600 24 1.6 609.3 1.2X
-SQL Json with UnsafeRow 10139 10159 28 1.6 644.6 1.1X
-SQL Parquet Vectorized: DataPageV1 285 300 14 55.2 18.1 38.9X
-SQL Parquet Vectorized: DataPageV2 232 264 21 67.9 14.7 47.9X
-SQL Parquet MR: DataPageV1 2439 2442 4 6.4 155.1 4.5X
-SQL Parquet MR: DataPageV2 2014 2020 8 7.8 128.0 5.5X
-SQL ORC Vectorized 165 173 9 95.2 10.5 67.1X
-SQL ORC MR 1682 1690 12 9.4 106.9 6.6X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 11431 11447 23 1.4 726.8 1.0X
+SQL Json 9801 9807 9 1.6 623.1 1.2X
+SQL Json with UnsafeRow 10539 10543 6 1.5 670.0 1.1X
+SQL Parquet Vectorized: DataPageV1 312 337 19 50.4 19.8 36.7X
+SQL Parquet Vectorized: DataPageV2 243 277 20 64.7 15.5 47.0X
+SQL Parquet MR: DataPageV1 2547 2571 34 6.2 161.9 4.5X
+SQL Parquet MR: DataPageV2 2120 2122 3 7.4 134.8 5.4X
+SQL ORC Vectorized 148 161 16 106.1 9.4 77.1X
+SQL ORC MR 1789 1808 28 8.8 113.7 6.4X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single BIGINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 352 357 5 44.7 22.4 1.0X
-ParquetReader Vectorized: DataPageV2 309 315 8 50.9 19.7 1.1X
-ParquetReader Vectorized -> Row: DataPageV1 330 335 5 47.6 21.0 1.1X
-ParquetReader Vectorized -> Row: DataPageV2 264 273 8 59.6 16.8 1.3X
+ParquetReader Vectorized: DataPageV1 333 338 3 47.2 21.2 1.0X
+ParquetReader Vectorized: DataPageV2 278 288 10 56.6 17.7 1.2X
+ParquetReader Vectorized -> Row: DataPageV1 324 330 6 48.5 20.6 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 275 286 8 57.3 17.5 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single FLOAT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 11874 11897 32 1.3 754.9 1.0X
-SQL Json 11112 11136 34 1.4 706.5 1.1X
-SQL Json with UnsafeRow 12000 12000 1 1.3 762.9 1.0X
-SQL Parquet Vectorized: DataPageV1 85 104 16 184.8 5.4 139.5X
-SQL Parquet Vectorized: DataPageV2 84 99 15 186.3 5.4 140.6X
-SQL Parquet MR: DataPageV1 1962 1964 3 8.0 124.7 6.1X
-SQL Parquet MR: DataPageV2 1899 1993 132 8.3 120.8 6.3X
-SQL ORC Vectorized 232 241 16 67.7 14.8 51.1X
-SQL ORC MR 1718 1729 17 9.2 109.2 6.9X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 11476 11505 41 1.4 729.6 1.0X
+SQL Json 11463 11529 93 1.4 728.8 1.0X
+SQL Json with UnsafeRow 11909 11918 13 1.3 757.1 1.0X
+SQL Parquet Vectorized: DataPageV1 92 110 15 170.2 5.9 124.2X
+SQL Parquet Vectorized: DataPageV2 93 106 14 169.7 5.9 123.8X
+SQL Parquet MR: DataPageV1 2111 2120 13 7.5 134.2 5.4X
+SQL Parquet MR: DataPageV2 2023 2032 12 7.8 128.6 5.7X
+SQL ORC Vectorized 227 239 15 69.4 14.4 50.6X
+SQL ORC MR 1846 1864 26 8.5 117.4 6.2X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single FLOAT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 133 139 6 118.4 8.4 1.0X
-ParquetReader Vectorized: DataPageV2 131 138 7 119.8 8.3 1.0X
-ParquetReader Vectorized -> Row: DataPageV1 128 133 6 122.7 8.1 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 129 133 4 122.1 8.2 1.0X
+ParquetReader Vectorized: DataPageV1 145 154 6 108.5 9.2 1.0X
+ParquetReader Vectorized: DataPageV2 143 151 8 110.0 9.1 1.0X
+ParquetReader Vectorized -> Row: DataPageV1 136 141 6 115.9 8.6 1.1X
+ParquetReader Vectorized -> Row: DataPageV2 134 142 7 117.3 8.5 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single DOUBLE Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 11741 11743 3 1.3 746.5 1.0X
-SQL Json 11539 11542 4 1.4 733.7 1.0X
-SQL Json with UnsafeRow 12260 12274 20 1.3 779.5 1.0X
-SQL Parquet Vectorized: DataPageV1 308 315 7 51.1 19.6 38.1X
-SQL Parquet Vectorized: DataPageV2 308 316 8 51.0 19.6 38.1X
-SQL Parquet MR: DataPageV1 2475 2493 25 6.4 157.4 4.7X
-SQL Parquet MR: DataPageV2 2406 2414 11 6.5 153.0 4.9X
-SQL ORC Vectorized 584 599 16 27.0 37.1 20.1X
-SQL ORC MR 2152 2167 21 7.3 136.8 5.5X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 11669 11686 25 1.3 741.9 1.0X
+SQL Json 11629 11633 6 1.4 739.3 1.0X
+SQL Json with UnsafeRow 12510 12513 5 1.3 795.3 0.9X
+SQL Parquet Vectorized: DataPageV1 325 332 9 48.3 20.7 35.9X
+SQL Parquet Vectorized: DataPageV2 275 307 22 57.1 17.5 42.4X
+SQL Parquet MR: DataPageV1 2500 2508 11 6.3 158.9 4.7X
+SQL Parquet MR: DataPageV2 2442 2454 16 6.4 155.3 4.8X
+SQL ORC Vectorized 599 613 26 26.3 38.1 19.5X
+SQL ORC MR 2361 2364 5 6.7 150.1 4.9X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single DOUBLE Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 314 319 4 50.1 20.0 1.0X
-ParquetReader Vectorized: DataPageV2 325 330 6 48.4 20.7 1.0X
-ParquetReader Vectorized -> Row: DataPageV1 324 331 9 48.5 20.6 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 326 330 4 48.3 20.7 1.0X
+ParquetReader Vectorized: DataPageV1 342 354 8 46.0 21.7 1.0X
+ParquetReader Vectorized: DataPageV2 343 349 5 45.8 21.8 1.0X
+ParquetReader Vectorized -> Row: DataPageV1 338 345 5 46.6 21.5 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 335 341 5 46.9 21.3 1.0X
================================================================================================
SQL Single Numeric Column Scan in Struct
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single TINYINT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2079 2176 137 7.6 132.2 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2147 2151 6 7.3 136.5 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 144 153 20 109.1 9.2 14.4X
-SQL Parquet MR: DataPageV1 2361 2371 14 6.7 150.1 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2672 2690 26 5.9 169.9 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 106 115 12 148.8 6.7 19.7X
-SQL Parquet MR: DataPageV2 2298 2311 18 6.8 146.1 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2604 2608 6 6.0 165.6 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 106 119 17 148.9 6.7 19.7X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2301 2403 145 6.8 146.3 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2357 2394 51 6.7 149.9 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 148 157 13 106.3 9.4 15.5X
+SQL Parquet MR: DataPageV1 2363 2396 47 6.7 150.2 1.0X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2914 2915 2 5.4 185.3 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 157 182 25 100.1 10.0 14.6X
+SQL Parquet MR: DataPageV2 2343 2347 7 6.7 148.9 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2892 2902 14 5.4 183.9 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 165 179 18 95.2 10.5 13.9X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single SMALLINT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2110 2113 5 7.5 134.2 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2097 2119 32 7.5 133.3 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 280 287 13 56.2 17.8 7.5X
-SQL Parquet MR: DataPageV1 2483 2487 5 6.3 157.9 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2984 2985 1 5.3 189.7 0.7X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 111 143 26 141.6 7.1 19.0X
-SQL Parquet MR: DataPageV2 2440 2442 4 6.4 155.1 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2873 2896 32 5.5 182.7 0.7X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 206 232 26 76.5 13.1 10.3X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2471 2484 17 6.4 157.1 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2471 2492 29 6.4 157.1 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 273 286 17 57.6 17.4 9.1X
+SQL Parquet MR: DataPageV1 2486 2507 29 6.3 158.1 1.0X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2970 2974 6 5.3 188.8 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 119 139 17 132.4 7.6 20.8X
+SQL Parquet MR: DataPageV2 2499 2526 38 6.3 158.9 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2896 2910 21 5.4 184.1 0.9X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 155 194 21 101.2 9.9 15.9X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single INT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2198 2266 97 7.2 139.7 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2204 2227 33 7.1 140.1 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 299 312 19 52.6 19.0 7.4X
-SQL Parquet MR: DataPageV1 2426 2442 23 6.5 154.2 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3032 3036 5 5.2 192.8 0.7X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 106 130 21 148.4 6.7 20.7X
-SQL Parquet MR: DataPageV2 2427 2441 20 6.5 154.3 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2892 2906 20 5.4 183.9 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 289 305 17 54.5 18.3 7.6X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2430 2496 92 6.5 154.5 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2576 2588 17 6.1 163.8 0.9X
+SQL ORC Vectorized (Nested Column Enabled) 275 291 22 57.1 17.5 8.8X
+SQL Parquet MR: DataPageV1 2578 2587 13 6.1 163.9 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3173 3204 45 5.0 201.7 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 132 140 4 118.9 8.4 18.4X
+SQL Parquet MR: DataPageV2 2580 2608 40 6.1 164.0 0.9X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 3159 3179 28 5.0 200.8 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 231 247 18 68.2 14.7 10.5X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single BIGINT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2180 2185 7 7.2 138.6 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2182 2185 4 7.2 138.7 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 302 311 18 52.1 19.2 7.2X
-SQL Parquet MR: DataPageV1 2798 2824 36 5.6 177.9 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3348 3353 7 4.7 212.9 0.7X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 322 330 8 48.8 20.5 6.8X
-SQL Parquet MR: DataPageV2 2371 2385 20 6.6 150.7 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2861 2873 17 5.5 181.9 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 254 297 23 61.9 16.2 8.6X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2695 2705 13 5.8 171.4 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2702 2716 20 5.8 171.8 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 277 300 34 56.7 17.6 9.7X
+SQL Parquet MR: DataPageV1 3101 3103 2 5.1 197.1 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3865 3870 6 4.1 245.7 0.7X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 346 359 21 45.4 22.0 7.8X
+SQL Parquet MR: DataPageV2 2590 2608 25 6.1 164.7 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 3178 3185 10 4.9 202.0 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 279 314 16 56.3 17.8 9.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single FLOAT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2367 2453 123 6.6 150.5 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2321 2339 26 6.8 147.6 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 357 368 22 44.0 22.7 6.6X
-SQL Parquet MR: DataPageV1 2306 2327 30 6.8 146.6 1.0X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2783 2784 1 5.7 177.0 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 93 103 6 169.4 5.9 25.5X
-SQL Parquet MR: DataPageV2 2306 2312 8 6.8 146.6 1.0X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2710 2724 19 5.8 172.3 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 90 116 23 174.0 5.7 26.2X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2490 2582 130 6.3 158.3 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2698 2699 1 5.8 171.5 0.9X
+SQL ORC Vectorized (Nested Column Enabled) 348 354 3 45.2 22.1 7.2X
+SQL Parquet MR: DataPageV1 2637 2653 22 6.0 167.7 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3035 3051 22 5.2 193.0 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 117 154 17 134.8 7.4 21.3X
+SQL Parquet MR: DataPageV2 2560 2579 26 6.1 162.8 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2924 2926 3 5.4 185.9 0.9X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 99 118 15 158.5 6.3 25.1X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single DOUBLE Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2547 2564 24 6.2 162.0 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2591 2602 15 6.1 164.7 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 721 722 1 21.8 45.8 3.5X
-SQL Parquet MR: DataPageV1 2777 2783 8 5.7 176.6 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3278 3282 6 4.8 208.4 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 310 324 11 50.7 19.7 8.2X
-SQL Parquet MR: DataPageV2 2742 2758 22 5.7 174.3 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 3149 3165 22 5.0 200.2 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 307 317 8 51.3 19.5 8.3X
+SQL ORC MR 2811 2839 41 5.6 178.7 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2866 2870 5 5.5 182.2 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 722 726 5 21.8 45.9 3.9X
+SQL Parquet MR: DataPageV1 2998 2998 1 5.2 190.6 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3518 3530 16 4.5 223.7 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 336 341 7 46.9 21.3 8.4X
+SQL Parquet MR: DataPageV2 2939 2954 22 5.4 186.8 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 3408 3419 15 4.6 216.7 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 326 341 10 48.3 20.7 8.6X
================================================================================================
SQL Nested Column Scan
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Nested Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 13328 13415 73 0.1 12711.0 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 13285 13333 28 0.1 12670.0 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 7170 7196 14 0.1 6837.5 1.9X
-SQL Parquet MR: DataPageV1 9251 9339 83 0.1 8822.7 1.4X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 9546 9592 39 0.1 9103.6 1.4X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 5892 5932 24 0.2 5618.8 2.3X
-SQL Parquet MR: DataPageV2 9848 10065 239 0.1 9392.2 1.4X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 10250 10501 199 0.1 9775.5 1.3X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 5653 5720 31 0.2 5390.8 2.4X
+SQL ORC MR 14501 14817 190 0.1 13828.8 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 14626 15009 205 0.1 13948.9 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 7701 7776 33 0.1 7344.1 1.9X
+SQL Parquet MR: DataPageV1 9945 10009 58 0.1 9484.3 1.5X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 10227 10319 57 0.1 9753.7 1.4X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 6799 6970 93 0.2 6483.6 2.1X
+SQL Parquet MR: DataPageV2 10726 11061 289 0.1 10229.5 1.4X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 10919 11197 260 0.1 10413.5 1.3X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 6398 6474 57 0.2 6101.6 2.3X
================================================================================================
Int and String Scan
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Int and String Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 10418 10449 44 1.0 993.5 1.0X
-SQL Json 10216 10220 5 1.0 974.3 1.0X
-SQL Parquet Vectorized: DataPageV1 1761 1786 35 6.0 168.0 5.9X
-SQL Parquet Vectorized: DataPageV2 1978 1994 22 5.3 188.7 5.3X
-SQL Parquet MR: DataPageV1 4085 4092 9 2.6 389.6 2.6X
-SQL Parquet MR: DataPageV2 4058 4074 22 2.6 387.0 2.6X
-SQL ORC Vectorized 1905 1927 31 5.5 181.6 5.5X
-SQL ORC MR 3633 3644 15 2.9 346.5 2.9X
+SQL CSV 10362 10412 70 1.0 988.2 1.0X
+SQL Json 10177 10208 45 1.0 970.5 1.0X
+SQL Parquet Vectorized: DataPageV1 1821 1832 15 5.8 173.7 5.7X
+SQL Parquet Vectorized: DataPageV2 2053 2057 5 5.1 195.8 5.0X
+SQL Parquet MR: DataPageV1 4043 4056 18 2.6 385.5 2.6X
+SQL Parquet MR: DataPageV2 3960 3966 8 2.6 377.7 2.6X
+SQL ORC Vectorized 1785 1791 8 5.9 170.2 5.8X
+SQL ORC MR 3663 3687 33 2.9 349.3 2.8X
================================================================================================
Repeated String Scan
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repeated String: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 5454 5472 25 1.9 520.1 1.0X
-SQL Json 6444 6445 2 1.6 614.6 0.8X
-SQL Parquet Vectorized: DataPageV1 529 538 9 19.8 50.5 10.3X
-SQL Parquet Vectorized: DataPageV2 543 556 13 19.3 51.8 10.0X
-SQL Parquet MR: DataPageV1 1776 1792 23 5.9 169.4 3.1X
-SQL Parquet MR: DataPageV2 1662 1671 13 6.3 158.5 3.3X
-SQL ORC Vectorized 367 371 3 28.6 35.0 14.9X
-SQL ORC MR 1795 1816 29 5.8 171.2 3.0X
+SQL CSV 5839 5892 75 1.8 556.9 1.0X
+SQL Json 6442 6448 8 1.6 614.3 0.9X
+SQL Parquet Vectorized: DataPageV1 490 496 5 21.4 46.7 11.9X
+SQL Parquet Vectorized: DataPageV2 466 471 4 22.5 44.5 12.5X
+SQL Parquet MR: DataPageV1 1670 1688 26 6.3 159.2 3.5X
+SQL Parquet MR: DataPageV2 1601 1631 42 6.5 152.7 3.6X
+SQL ORC Vectorized 390 396 6 26.9 37.2 15.0X
+SQL ORC MR 1846 1867 29 5.7 176.1 3.2X
================================================================================================
Partitioned Table Scan
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Partitioned Table: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-Data column - CSV 10869 10873 6 1.4 691.0 1.0X
-Data column - Json 9344 9391 67 1.7 594.1 1.2X
-Data column - Parquet Vectorized: DataPageV1 112 126 10 140.1 7.1 96.8X
-Data column - Parquet Vectorized: DataPageV2 218 241 19 72.0 13.9 49.7X
-Data column - Parquet MR: DataPageV1 2361 2395 48 6.7 150.1 4.6X
-Data column - Parquet MR: DataPageV2 2300 2301 2 6.8 146.2 4.7X
-Data column - ORC Vectorized 154 165 13 101.8 9.8 70.4X
-Data column - ORC MR 1990 2000 15 7.9 126.5 5.5X
-Partition column - CSV 3690 3704 20 4.3 234.6 2.9X
-Partition column - Json 8499 8531 46 1.9 540.3 1.3X
-Partition column - Parquet Vectorized: DataPageV1 30 41 10 521.6 1.9 360.5X
-Partition column - Parquet Vectorized: DataPageV2 29 34 6 548.7 1.8 379.2X
-Partition column - Parquet MR: DataPageV1 1245 1260 22 12.6 79.1 8.7X
-Partition column - Parquet MR: DataPageV2 1250 1261 15 12.6 79.5 8.7X
-Partition column - ORC Vectorized 30 34 6 520.5 1.9 359.6X
-Partition column - ORC MR 1220 1221 1 12.9 77.6 8.9X
-Both columns - CSV 10588 10682 134 1.5 673.2 1.0X
-Both columns - Json 9542 9545 4 1.6 606.7 1.1X
-Both columns - Parquet Vectorized: DataPageV1 117 141 20 134.0 7.5 92.6X
-Both columns - Parquet Vectorized: DataPageV2 241 262 20 65.2 15.3 45.0X
-Both columns - Parquet MR: DataPageV1 2266 2270 6 6.9 144.1 4.8X
-Both columns - Parquet MR: DataPageV2 2202 2237 50 7.1 140.0 4.9X
-Both columns - ORC Vectorized 158 200 32 99.4 10.1 68.7X
-Both columns - ORC MR 1941 1950 13 8.1 123.4 5.6X
+Data column - CSV 11085 11095 14 1.4 704.8 1.0X
+Data column - Json 9608 9800 272 1.6 610.8 1.2X
+Data column - Parquet Vectorized: DataPageV1 108 130 20 145.0 6.9 102.2X
+Data column - Parquet Vectorized: DataPageV2 234 254 19 67.1 14.9 47.3X
+Data column - Parquet MR: DataPageV1 2352 2355 4 6.7 149.5 4.7X
+Data column - Parquet MR: DataPageV2 2308 2384 107 6.8 146.7 4.8X
+Data column - ORC Vectorized 175 187 16 90.0 11.1 63.4X
+Data column - ORC MR 2001 2009 12 7.9 127.2 5.5X
+Partition column - CSV 3583 3630 67 4.4 227.8 3.1X
+Partition column - Json 8739 8762 32 1.8 555.6 1.3X
+Partition column - Parquet Vectorized: DataPageV1 35 44 11 448.9 2.2 316.4X
+Partition column - Parquet Vectorized: DataPageV2 34 43 7 467.8 2.1 329.7X
+Partition column - Parquet MR: DataPageV1 1249 1258 13 12.6 79.4 8.9X
+Partition column - Parquet MR: DataPageV2 1237 1248 15 12.7 78.7 9.0X
+Partition column - ORC Vectorized 34 40 7 465.0 2.2 327.7X
+Partition column - ORC MR 1290 1291 1 12.2 82.0 8.6X
+Both columns - CSV 11214 11244 43 1.4 712.9 1.0X
+Both columns - Json 9546 9567 30 1.6 606.9 1.2X
+Both columns - Parquet Vectorized: DataPageV1 130 161 20 120.7 8.3 85.0X
+Both columns - Parquet Vectorized: DataPageV2 248 273 26 63.3 15.8 44.6X
+Both columns - Parquet MR: DataPageV1 2305 2321 22 6.8 146.6 4.8X
+Both columns - Parquet MR: DataPageV2 2274 2288 21 6.9 144.6 4.9X
+Both columns - ORC Vectorized 171 203 29 91.9 10.9 64.7X
+Both columns - ORC MR 2067 2083 23 7.6 131.4 5.4X
================================================================================================
String with Nulls Scan
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String with Nulls Scan (0.0%): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 7234 7254 29 1.4 689.9 1.0X
-SQL Json 8754 8758 5 1.2 834.9 0.8X
-SQL Parquet Vectorized: DataPageV1 1139 1151 17 9.2 108.6 6.4X
-SQL Parquet Vectorized: DataPageV2 1469 1482 18 7.1 140.1 4.9X
-SQL Parquet MR: DataPageV1 3437 3441 5 3.1 327.8 2.1X
-SQL Parquet MR: DataPageV2 3643 3666 33 2.9 347.4 2.0X
-ParquetReader Vectorized: DataPageV1 759 765 9 13.8 72.4 9.5X
-ParquetReader Vectorized: DataPageV2 1099 1105 8 9.5 104.8 6.6X
-SQL ORC Vectorized 820 834 22 12.8 78.2 8.8X
-SQL ORC MR 2782 2792 14 3.8 265.3 2.6X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 7331 7353 30 1.4 699.2 1.0X
+SQL Json 9139 9253 160 1.1 871.6 0.8X
+SQL Parquet Vectorized: DataPageV1 1184 1208 35 8.9 112.9 6.2X
+SQL Parquet Vectorized: DataPageV2 1517 1526 12 6.9 144.7 4.8X
+SQL Parquet MR: DataPageV1 3688 3709 29 2.8 351.7 2.0X
+SQL Parquet MR: DataPageV2 3820 3831 16 2.7 364.3 1.9X
+ParquetReader Vectorized: DataPageV1 785 800 13 13.4 74.8 9.3X
+ParquetReader Vectorized: DataPageV2 1096 1114 25 9.6 104.5 6.7X
+SQL ORC Vectorized 785 850 57 13.4 74.9 9.3X
+SQL ORC MR 3070 3081 15 3.4 292.8 2.4X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String with Nulls Scan (50.0%): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 5381 5407 37 1.9 513.2 1.0X
-SQL Json 7194 7264 99 1.5 686.1 0.7X
-SQL Parquet Vectorized: DataPageV1 742 753 16 14.1 70.7 7.3X
-SQL Parquet Vectorized: DataPageV2 976 978 3 10.7 93.1 5.5X
-SQL Parquet MR: DataPageV1 2764 2777 17 3.8 263.6 1.9X
-SQL Parquet MR: DataPageV2 2846 2853 10 3.7 271.4 1.9X
-ParquetReader Vectorized: DataPageV1 721 732 12 14.6 68.7 7.5X
-ParquetReader Vectorized: DataPageV2 916 919 3 11.5 87.3 5.9X
-SQL ORC Vectorized 974 987 19 10.8 92.9 5.5X
-SQL ORC MR 2695 2707 17 3.9 257.0 2.0X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 5577 5588 15 1.9 531.9 1.0X
+SQL Json 7460 7462 3 1.4 711.4 0.7X
+SQL Parquet Vectorized: DataPageV1 807 824 15 13.0 76.9 6.9X
+SQL Parquet Vectorized: DataPageV2 1117 1119 2 9.4 106.5 5.0X
+SQL Parquet MR: DataPageV1 2808 2815 10 3.7 267.8 2.0X
+SQL Parquet MR: DataPageV2 2946 2957 15 3.6 280.9 1.9X
+ParquetReader Vectorized: DataPageV1 715 723 8 14.7 68.1 7.8X
+ParquetReader Vectorized: DataPageV2 936 940 3 11.2 89.3 6.0X
+SQL ORC Vectorized 953 971 24 11.0 90.8 5.9X
+SQL ORC MR 2817 2848 43 3.7 268.7 2.0X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String with Nulls Scan (95.0%): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 3904 3912 11 2.7 372.4 1.0X
-SQL Json 5105 5123 26 2.1 486.8 0.8X
-SQL Parquet Vectorized: DataPageV1 175 179 5 59.8 16.7 22.3X
-SQL Parquet Vectorized: DataPageV2 195 197 1 53.7 18.6 20.0X
-SQL Parquet MR: DataPageV1 1629 1637 11 6.4 155.4 2.4X
-SQL Parquet MR: DataPageV2 1575 1609 48 6.7 150.2 2.5X
-ParquetReader Vectorized: DataPageV1 174 176 1 60.1 16.6 22.4X
-ParquetReader Vectorized: DataPageV2 204 205 1 51.5 19.4 19.2X
-SQL ORC Vectorized 344 351 6 30.5 32.8 11.4X
-SQL ORC MR 1582 1603 29 6.6 150.9 2.5X
+SQL CSV 4347 4352 6 2.4 414.6 1.0X
+SQL Json 5219 5224 6 2.0 497.7 0.8X
+SQL Parquet Vectorized: DataPageV1 163 173 10 64.3 15.6 26.6X
+SQL Parquet Vectorized: DataPageV2 201 227 15 52.1 19.2 21.6X
+SQL Parquet MR: DataPageV1 1765 1774 13 5.9 168.3 2.5X
+SQL Parquet MR: DataPageV2 1710 1712 2 6.1 163.1 2.5X
+ParquetReader Vectorized: DataPageV1 172 179 7 61.0 16.4 25.3X
+ParquetReader Vectorized: DataPageV2 205 211 3 51.0 19.6 21.2X
+SQL ORC Vectorized 332 337 8 31.6 31.6 13.1X
+SQL ORC MR 1636 1637 1 6.4 156.1 2.7X
================================================================================================
Single Column Scan From Wide Columns
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Single Column Scan from 10 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 1131 1159 40 0.9 1078.4 1.0X
-SQL Json 1731 1740 13 0.6 1650.7 0.7X
-SQL Parquet Vectorized: DataPageV1 25 29 6 42.1 23.7 45.4X
-SQL Parquet Vectorized: DataPageV2 33 37 6 32.1 31.1 34.7X
-SQL Parquet MR: DataPageV1 153 160 6 6.8 146.3 7.4X
-SQL Parquet MR: DataPageV2 151 161 8 6.9 144.1 7.5X
-SQL ORC Vectorized 27 31 6 39.0 25.6 42.0X
-SQL ORC MR 128 135 6 8.2 121.8 8.9X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 1131 1132 2 0.9 1078.4 1.0X
+SQL Json 1788 1791 4 0.6 1704.9 0.6X
+SQL Parquet Vectorized: DataPageV1 29 35 6 35.8 28.0 38.6X
+SQL Parquet Vectorized: DataPageV2 37 44 7 28.6 35.0 30.8X
+SQL Parquet MR: DataPageV1 157 166 8 6.7 150.2 7.2X
+SQL Parquet MR: DataPageV2 162 175 7 6.5 154.5 7.0X
+SQL ORC Vectorized 32 38 7 32.7 30.6 35.2X
+SQL ORC MR 150 158 8 7.0 142.9 7.5X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Single Column Scan from 50 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 2518 2519 1 0.4 2401.5 1.0X
-SQL Json 5418 5442 33 0.2 5167.0 0.5X
-SQL Parquet Vectorized: DataPageV1 28 34 7 38.1 26.2 91.6X
-SQL Parquet Vectorized: DataPageV2 31 36 6 33.4 30.0 80.2X
-SQL Parquet MR: DataPageV1 159 169 5 6.6 151.7 15.8X
-SQL Parquet MR: DataPageV2 162 171 5 6.5 154.9 15.5X
-SQL ORC Vectorized 30 35 6 34.8 28.7 83.6X
-SQL ORC MR 132 143 7 7.9 126.0 19.1X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 2424 2438 20 0.4 2311.5 1.0X
+SQL Json 6479 6527 69 0.2 6178.6 0.4X
+SQL Parquet Vectorized: DataPageV1 31 36 6 33.5 29.8 77.5X
+SQL Parquet Vectorized: DataPageV2 38 46 8 27.8 36.0 64.2X
+SQL Parquet MR: DataPageV1 167 174 6 6.3 159.6 14.5X
+SQL Parquet MR: DataPageV2 169 178 6 6.2 161.0 14.4X
+SQL ORC Vectorized 36 45 8 29.3 34.2 67.6X
+SQL ORC MR 164 170 4 6.4 156.6 14.8X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Single Column Scan from 100 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 4195 4198 4 0.2 4000.7 1.0X
-SQL Json 10366 10415 69 0.1 9886.0 0.4X
-SQL Parquet Vectorized: DataPageV1 34 40 7 30.7 32.5 122.9X
-SQL Parquet Vectorized: DataPageV2 38 41 4 27.4 36.5 109.6X
-SQL Parquet MR: DataPageV1 169 178 6 6.2 160.8 24.9X
-SQL Parquet MR: DataPageV2 176 181 4 6.0 167.4 23.9X
-SQL ORC Vectorized 36 41 6 29.1 34.4 116.3X
-SQL ORC MR 140 146 8 7.5 133.4 30.0X
+SQL CSV 3988 4030 59 0.3 3802.9 1.0X
+SQL Json 10875 10928 75 0.1 10370.8 0.4X
+SQL Parquet Vectorized: DataPageV1 38 46 8 27.7 36.1 105.4X
+SQL Parquet Vectorized: DataPageV2 45 52 8 23.1 43.3 87.8X
+SQL Parquet MR: DataPageV1 175 194 8 6.0 167.3 22.7X
+SQL Parquet MR: DataPageV2 186 195 4 5.6 177.8 21.4X
+SQL ORC Vectorized 41 46 6 25.5 39.1 97.1X
+SQL ORC MR 156 169 5 6.7 148.8 25.6X
diff --git a/sql/core/benchmarks/DataSourceReadBenchmark-results.txt b/sql/core/benchmarks/DataSourceReadBenchmark-results.txt
index f8627fb101679..ad66e68428bcf 100644
--- a/sql/core/benchmarks/DataSourceReadBenchmark-results.txt
+++ b/sql/core/benchmarks/DataSourceReadBenchmark-results.txt
@@ -2,437 +2,437 @@
SQL Single Numeric Column Scan
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single BOOLEAN Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 12149 12272 173 1.3 772.4 1.0X
-SQL Json 8354 8445 129 1.9 531.1 1.5X
-SQL Json with UnsafeRow 9377 9393 22 1.7 596.2 1.3X
-SQL Parquet Vectorized: DataPageV1 101 113 8 155.1 6.4 119.8X
-SQL Parquet Vectorized: DataPageV2 103 112 7 152.8 6.5 118.0X
-SQL Parquet MR: DataPageV1 1767 1776 13 8.9 112.3 6.9X
-SQL Parquet MR: DataPageV2 1721 1730 12 9.1 109.4 7.1X
-SQL ORC Vectorized 136 143 5 115.5 8.7 89.2X
-SQL ORC MR 1485 1489 6 10.6 94.4 8.2X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 12682 12766 120 1.2 806.3 1.0X
+SQL Json 8232 8269 52 1.9 523.4 1.5X
+SQL Json with UnsafeRow 9077 9103 36 1.7 577.1 1.4X
+SQL Parquet Vectorized: DataPageV1 103 119 9 152.6 6.6 123.0X
+SQL Parquet Vectorized: DataPageV2 117 124 5 133.9 7.5 107.9X
+SQL Parquet MR: DataPageV1 1788 1799 15 8.8 113.7 7.1X
+SQL Parquet MR: DataPageV2 1730 1738 11 9.1 110.0 7.3X
+SQL ORC Vectorized 143 149 4 110.0 9.1 88.7X
+SQL ORC MR 1585 1599 19 9.9 100.8 8.0X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single BOOLEAN Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 87 88 1 180.4 5.5 1.0X
-ParquetReader Vectorized: DataPageV2 94 95 1 166.9 6.0 0.9X
-ParquetReader Vectorized -> Row: DataPageV1 73 74 1 215.3 4.6 1.2X
-ParquetReader Vectorized -> Row: DataPageV2 82 83 2 191.9 5.2 1.1X
+ParquetReader Vectorized: DataPageV1 95 96 1 165.7 6.0 1.0X
+ParquetReader Vectorized: DataPageV2 119 120 1 132.7 7.5 0.8X
+ParquetReader Vectorized -> Row: DataPageV1 75 76 1 208.9 4.8 1.3X
+ParquetReader Vectorized -> Row: DataPageV2 99 102 4 158.1 6.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single TINYINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 11552 11570 25 1.4 734.5 1.0X
-SQL Json 9556 9560 6 1.6 607.6 1.2X
-SQL Json with UnsafeRow 10151 10165 20 1.5 645.4 1.1X
-SQL Parquet Vectorized: DataPageV1 92 99 8 170.9 5.9 125.5X
-SQL Parquet Vectorized: DataPageV2 91 98 5 172.6 5.8 126.8X
-SQL Parquet MR: DataPageV1 1972 2005 47 8.0 125.4 5.9X
-SQL Parquet MR: DataPageV2 1895 1927 45 8.3 120.5 6.1X
-SQL ORC Vectorized 130 139 11 121.3 8.2 89.1X
-SQL ORC MR 1455 1462 11 10.8 92.5 7.9X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 12590 12760 241 1.2 800.4 1.0X
+SQL Json 9103 9139 51 1.7 578.8 1.4X
+SQL Json with UnsafeRow 9946 9973 37 1.6 632.4 1.3X
+SQL Parquet Vectorized: DataPageV1 92 101 7 171.2 5.8 137.1X
+SQL Parquet Vectorized: DataPageV2 91 98 5 173.0 5.8 138.5X
+SQL Parquet MR: DataPageV1 1855 1864 13 8.5 117.9 6.8X
+SQL Parquet MR: DataPageV2 1808 1812 5 8.7 115.0 7.0X
+SQL ORC Vectorized 115 122 6 136.4 7.3 109.2X
+SQL ORC MR 1459 1459 1 10.8 92.7 8.6X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single TINYINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 68 70 1 231.1 4.3 1.0X
-ParquetReader Vectorized: DataPageV2 68 69 1 230.3 4.3 1.0X
-ParquetReader Vectorized -> Row: DataPageV1 48 49 2 329.2 3.0 1.4X
-ParquetReader Vectorized -> Row: DataPageV2 48 49 1 329.1 3.0 1.4X
+ParquetReader Vectorized: DataPageV1 70 72 2 225.9 4.4 1.0X
+ParquetReader Vectorized: DataPageV2 70 71 1 224.9 4.4 1.0X
+ParquetReader Vectorized -> Row: DataPageV1 47 48 1 336.8 3.0 1.5X
+ParquetReader Vectorized -> Row: DataPageV2 47 48 1 335.4 3.0 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single SMALLINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 11987 11990 4 1.3 762.1 1.0X
-SQL Json 9896 9903 10 1.6 629.2 1.2X
-SQL Json with UnsafeRow 10451 10472 29 1.5 664.5 1.1X
-SQL Parquet Vectorized: DataPageV1 101 105 4 155.8 6.4 118.7X
-SQL Parquet Vectorized: DataPageV2 134 138 4 117.2 8.5 89.3X
-SQL Parquet MR: DataPageV1 2115 2150 50 7.4 134.5 5.7X
-SQL Parquet MR: DataPageV2 1958 1962 6 8.0 124.5 6.1X
-SQL ORC Vectorized 129 132 2 121.7 8.2 92.8X
-SQL ORC MR 1597 1610 18 9.8 101.5 7.5X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 13145 13165 28 1.2 835.7 1.0X
+SQL Json 9536 9550 20 1.6 606.3 1.4X
+SQL Json with UnsafeRow 10364 10401 53 1.5 658.9 1.3X
+SQL Parquet Vectorized: DataPageV1 109 114 3 143.9 6.9 120.3X
+SQL Parquet Vectorized: DataPageV2 138 141 3 113.7 8.8 95.0X
+SQL Parquet MR: DataPageV1 2015 2019 5 7.8 128.1 6.5X
+SQL Parquet MR: DataPageV2 1969 1977 11 8.0 125.2 6.7X
+SQL ORC Vectorized 127 131 3 123.8 8.1 103.4X
+SQL ORC MR 1673 1677 7 9.4 106.3 7.9X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single SMALLINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 139 140 1 113.2 8.8 1.0X
-ParquetReader Vectorized: DataPageV2 173 174 1 90.9 11.0 0.8X
-ParquetReader Vectorized -> Row: DataPageV1 136 139 2 115.3 8.7 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 170 173 2 92.3 10.8 0.8X
+ParquetReader Vectorized: DataPageV1 141 142 1 111.9 8.9 1.0X
+ParquetReader Vectorized: DataPageV2 170 171 1 92.5 10.8 0.8X
+ParquetReader Vectorized -> Row: DataPageV1 139 140 1 113.4 8.8 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 168 169 2 93.9 10.7 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single INT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 13126 13151 35 1.2 834.5 1.0X
-SQL Json 10020 10023 5 1.6 637.0 1.3X
-SQL Json with UnsafeRow 10792 10812 29 1.5 686.2 1.2X
-SQL Parquet Vectorized: DataPageV1 100 107 10 156.8 6.4 130.9X
-SQL Parquet Vectorized: DataPageV2 180 183 5 87.5 11.4 73.0X
-SQL Parquet MR: DataPageV1 2141 2270 183 7.3 136.1 6.1X
-SQL Parquet MR: DataPageV2 1978 2002 34 8.0 125.8 6.6X
-SQL ORC Vectorized 146 150 4 107.6 9.3 89.8X
-SQL ORC MR 1623 1630 10 9.7 103.2 8.1X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 14110 14121 15 1.1 897.1 1.0X
+SQL Json 9936 9949 19 1.6 631.7 1.4X
+SQL Json with UnsafeRow 10717 10718 1 1.5 681.4 1.3X
+SQL Parquet Vectorized: DataPageV1 108 112 3 145.7 6.9 130.7X
+SQL Parquet Vectorized: DataPageV2 178 182 4 88.3 11.3 79.3X
+SQL Parquet MR: DataPageV1 2086 2135 69 7.5 132.6 6.8X
+SQL Parquet MR: DataPageV2 2059 2070 17 7.6 130.9 6.9X
+SQL ORC Vectorized 146 149 3 107.6 9.3 96.5X
+SQL ORC MR 1668 1670 3 9.4 106.0 8.5X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single INT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 142 144 1 110.7 9.0 1.0X
-ParquetReader Vectorized: DataPageV2 216 218 2 72.8 13.7 0.7X
-ParquetReader Vectorized -> Row: DataPageV1 139 142 2 112.9 8.9 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 214 215 2 73.5 13.6 0.7X
+ParquetReader Vectorized: DataPageV1 142 144 1 110.6 9.0 1.0X
+ParquetReader Vectorized: DataPageV2 212 214 1 74.2 13.5 0.7X
+ParquetReader Vectorized -> Row: DataPageV1 140 144 5 112.3 8.9 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 210 212 1 74.8 13.4 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single BIGINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 12940 12949 13 1.2 822.7 1.0X
-SQL Json 10064 10080 22 1.6 639.9 1.3X
-SQL Json with UnsafeRow 10745 10775 43 1.5 683.1 1.2X
-SQL Parquet Vectorized: DataPageV1 286 289 3 55.0 18.2 45.2X
-SQL Parquet Vectorized: DataPageV2 175 178 3 90.0 11.1 74.0X
-SQL Parquet MR: DataPageV1 2462 2484 31 6.4 156.5 5.3X
-SQL Parquet MR: DataPageV2 1998 2017 27 7.9 127.0 6.5X
-SQL ORC Vectorized 132 137 4 118.8 8.4 97.8X
-SQL ORC MR 1673 1677 7 9.4 106.3 7.7X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 13768 13773 7 1.1 875.4 1.0X
+SQL Json 9915 9933 24 1.6 630.4 1.4X
+SQL Json with UnsafeRow 10669 10685 22 1.5 678.3 1.3X
+SQL Parquet Vectorized: DataPageV1 284 296 8 55.4 18.1 48.5X
+SQL Parquet Vectorized: DataPageV2 200 203 3 78.6 12.7 68.8X
+SQL Parquet MR: DataPageV1 2647 2676 41 5.9 168.3 5.2X
+SQL Parquet MR: DataPageV2 2116 2163 67 7.4 134.5 6.5X
+SQL ORC Vectorized 128 137 9 122.5 8.2 107.2X
+SQL ORC MR 1691 1702 15 9.3 107.5 8.1X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single BIGINT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 315 322 11 49.9 20.0 1.0X
-ParquetReader Vectorized: DataPageV2 205 206 1 76.9 13.0 1.5X
-ParquetReader Vectorized -> Row: DataPageV1 332 334 2 47.4 21.1 0.9X
-ParquetReader Vectorized -> Row: DataPageV2 219 221 2 71.8 13.9 1.4X
+ParquetReader Vectorized: DataPageV1 320 322 1 49.1 20.4 1.0X
+ParquetReader Vectorized: DataPageV2 218 220 2 72.1 13.9 1.5X
+ParquetReader Vectorized -> Row: DataPageV1 329 332 2 47.8 20.9 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 232 234 2 67.7 14.8 1.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single FLOAT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 13460 13468 11 1.2 855.8 1.0X
-SQL Json 11451 11489 54 1.4 728.0 1.2X
-SQL Json with UnsafeRow 12351 12372 29 1.3 785.2 1.1X
-SQL Parquet Vectorized: DataPageV1 82 85 3 190.9 5.2 163.3X
-SQL Parquet Vectorized: DataPageV2 81 84 3 193.8 5.2 165.8X
-SQL Parquet MR: DataPageV1 2027 2080 76 7.8 128.9 6.6X
-SQL Parquet MR: DataPageV2 1913 1922 13 8.2 121.6 7.0X
-SQL ORC Vectorized 242 246 5 65.1 15.4 55.7X
-SQL ORC MR 1788 1789 0 8.8 113.7 7.5X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 14385 14421 50 1.1 914.6 1.0X
+SQL Json 11200 11214 20 1.4 712.1 1.3X
+SQL Json with UnsafeRow 11987 12002 22 1.3 762.1 1.2X
+SQL Parquet Vectorized: DataPageV1 85 89 3 184.4 5.4 168.7X
+SQL Parquet Vectorized: DataPageV2 85 88 2 184.6 5.4 168.8X
+SQL Parquet MR: DataPageV1 2024 2024 1 7.8 128.7 7.1X
+SQL Parquet MR: DataPageV2 1935 1956 30 8.1 123.1 7.4X
+SQL ORC Vectorized 249 251 2 63.2 15.8 57.8X
+SQL ORC MR 1679 1690 15 9.4 106.8 8.6X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single FLOAT Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 138 138 0 114.3 8.7 1.0X
-ParquetReader Vectorized: DataPageV2 134 136 1 117.0 8.5 1.0X
-ParquetReader Vectorized -> Row: DataPageV1 133 136 6 118.1 8.5 1.0X
-ParquetReader Vectorized -> Row: DataPageV2 133 136 3 118.1 8.5 1.0X
+ParquetReader Vectorized: DataPageV1 135 137 1 116.5 8.6 1.0X
+ParquetReader Vectorized: DataPageV2 136 139 5 115.8 8.6 1.0X
+ParquetReader Vectorized -> Row: DataPageV1 134 138 8 117.1 8.5 1.0X
+ParquetReader Vectorized -> Row: DataPageV2 134 139 4 117.0 8.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single DOUBLE Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 13669 13678 12 1.2 869.1 1.0X
-SQL Json 11696 11714 25 1.3 743.6 1.2X
-SQL Json with UnsafeRow 12529 12545 23 1.3 796.6 1.1X
-SQL Parquet Vectorized: DataPageV1 261 263 3 60.3 16.6 52.4X
-SQL Parquet Vectorized: DataPageV2 260 264 3 60.4 16.6 52.5X
-SQL Parquet MR: DataPageV1 2457 2468 16 6.4 156.2 5.6X
-SQL Parquet MR: DataPageV2 2334 2398 91 6.7 148.4 5.9X
-SQL ORC Vectorized 576 582 4 27.3 36.7 23.7X
-SQL ORC MR 2114 2121 10 7.4 134.4 6.5X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 14585 14594 13 1.1 927.3 1.0X
+SQL Json 11269 11294 35 1.4 716.5 1.3X
+SQL Json with UnsafeRow 12098 12126 40 1.3 769.2 1.2X
+SQL Parquet Vectorized: DataPageV1 265 268 3 59.4 16.8 55.1X
+SQL Parquet Vectorized: DataPageV2 264 266 2 59.6 16.8 55.2X
+SQL Parquet MR: DataPageV1 2599 2606 10 6.1 165.2 5.6X
+SQL Parquet MR: DataPageV2 2488 2490 3 6.3 158.2 5.9X
+SQL ORC Vectorized 579 582 4 27.2 36.8 25.2X
+SQL ORC MR 2117 2144 38 7.4 134.6 6.9X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet Reader Single DOUBLE Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-ParquetReader Vectorized: DataPageV1 314 315 1 50.2 19.9 1.0X
-ParquetReader Vectorized: DataPageV2 308 324 31 51.1 19.6 1.0X
-ParquetReader Vectorized -> Row: DataPageV1 334 335 1 47.1 21.2 0.9X
-ParquetReader Vectorized -> Row: DataPageV2 335 336 1 47.0 21.3 0.9X
+ParquetReader Vectorized: DataPageV1 315 317 1 50.0 20.0 1.0X
+ParquetReader Vectorized: DataPageV2 317 318 1 49.6 20.2 1.0X
+ParquetReader Vectorized -> Row: DataPageV1 334 336 3 47.1 21.2 0.9X
+ParquetReader Vectorized -> Row: DataPageV2 333 334 1 47.2 21.2 0.9X
================================================================================================
SQL Single Numeric Column Scan in Struct
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single TINYINT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 1958 1972 21 8.0 124.5 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 1985 1986 1 7.9 126.2 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 127 133 6 123.8 8.1 15.4X
-SQL Parquet MR: DataPageV1 2395 2397 2 6.6 152.3 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2745 2754 12 5.7 174.5 0.7X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 99 105 5 158.2 6.3 19.7X
-SQL Parquet MR: DataPageV2 2291 2291 1 6.9 145.6 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2675 2681 9 5.9 170.1 0.7X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 99 104 5 159.2 6.3 19.8X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2048 2050 3 7.7 130.2 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2030 2053 33 7.7 129.1 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 112 116 4 140.7 7.1 18.3X
+SQL Parquet MR: DataPageV1 2205 2207 4 7.1 140.2 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2760 2826 93 5.7 175.5 0.7X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 95 99 5 166.0 6.0 21.6X
+SQL Parquet MR: DataPageV2 2145 2147 2 7.3 136.4 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2587 2591 6 6.1 164.5 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 94 99 3 166.9 6.0 21.7X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single SMALLINT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2000 2006 8 7.9 127.2 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2011 2016 7 7.8 127.9 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 284 290 7 55.3 18.1 7.0X
-SQL Parquet MR: DataPageV1 2499 2504 8 6.3 158.9 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3087 3089 3 5.1 196.3 0.6X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 112 120 8 141.0 7.1 17.9X
-SQL Parquet MR: DataPageV2 2322 2323 2 6.8 147.6 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2966 2969 5 5.3 188.6 0.7X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 240 253 10 65.5 15.3 8.3X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2057 2083 38 7.6 130.8 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2067 2072 7 7.6 131.4 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 257 262 7 61.3 16.3 8.0X
+SQL Parquet MR: DataPageV1 2475 2480 7 6.4 157.3 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3189 3196 10 4.9 202.8 0.6X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 125 129 4 125.9 7.9 16.5X
+SQL Parquet MR: DataPageV2 2370 2371 1 6.6 150.7 0.9X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2888 2892 6 5.4 183.6 0.7X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 244 247 2 64.4 15.5 8.4X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single INT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2118 2196 110 7.4 134.6 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2129 2184 77 7.4 135.4 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 293 304 9 53.8 18.6 7.2X
-SQL Parquet MR: DataPageV1 2483 2505 32 6.3 157.8 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3260 3265 6 4.8 207.3 0.6X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 113 127 17 138.8 7.2 18.7X
-SQL Parquet MR: DataPageV2 2326 2343 23 6.8 147.9 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2928 2944 23 5.4 186.2 0.7X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 259 264 3 60.8 16.4 8.2X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2069 2131 88 7.6 131.5 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2085 2115 43 7.5 132.5 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 278 287 6 56.6 17.7 7.4X
+SQL Parquet MR: DataPageV1 2350 2355 7 6.7 149.4 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2822 2836 20 5.6 179.4 0.7X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 115 118 3 136.4 7.3 17.9X
+SQL Parquet MR: DataPageV2 2285 2290 7 6.9 145.3 0.9X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2970 2981 16 5.3 188.8 0.7X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 257 260 3 61.2 16.3 8.0X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single BIGINT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2122 2165 61 7.4 134.9 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2113 2115 3 7.4 134.4 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 308 315 5 51.1 19.6 6.9X
-SQL Parquet MR: DataPageV1 2838 2865 38 5.5 180.4 0.7X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3238 3250 17 4.9 205.9 0.7X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 303 307 5 51.9 19.3 7.0X
-SQL Parquet MR: DataPageV2 2315 2332 24 6.8 147.2 0.9X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2685 2686 1 5.9 170.7 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 187 197 8 84.2 11.9 11.4X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2119 2146 39 7.4 134.7 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2143 2169 37 7.3 136.2 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 280 286 7 56.1 17.8 7.6X
+SQL Parquet MR: DataPageV1 2785 2794 14 5.6 177.0 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3359 3363 6 4.7 213.5 0.6X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 291 294 2 54.1 18.5 7.3X
+SQL Parquet MR: DataPageV2 2293 2321 39 6.9 145.8 0.9X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2871 2877 8 5.5 182.5 0.7X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 190 194 4 82.8 12.1 11.2X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single FLOAT Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2243 2255 17 7.0 142.6 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2229 2251 31 7.1 141.7 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 379 395 11 41.5 24.1 5.9X
-SQL Parquet MR: DataPageV1 2388 2408 28 6.6 151.8 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2869 2881 17 5.5 182.4 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 95 116 16 165.2 6.1 23.6X
-SQL Parquet MR: DataPageV2 2322 2333 16 6.8 147.6 1.0X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2769 2797 40 5.7 176.0 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 90 96 6 175.4 5.7 25.0X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL ORC MR 2262 2314 73 7.0 143.8 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2157 2185 40 7.3 137.1 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 380 383 3 41.3 24.2 5.9X
+SQL Parquet MR: DataPageV1 2395 2400 7 6.6 152.2 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 2865 2869 6 5.5 182.2 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 94 100 6 167.9 6.0 24.2X
+SQL Parquet MR: DataPageV2 2343 2351 12 6.7 148.9 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 2799 2807 11 5.6 177.9 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 93 99 7 169.2 5.9 24.3X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Single DOUBLE Column Scan in Struct: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 2570 2570 0 6.1 163.4 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 2576 2581 6 6.1 163.8 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 721 722 2 21.8 45.8 3.6X
-SQL Parquet MR: DataPageV1 2808 2831 34 5.6 178.5 0.9X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3286 3316 42 4.8 208.9 0.8X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 283 296 12 55.5 18.0 9.1X
-SQL Parquet MR: DataPageV2 2642 2659 23 6.0 168.0 1.0X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 3126 3129 5 5.0 198.7 0.8X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 289 297 7 54.4 18.4 8.9X
+SQL ORC MR 2589 2613 34 6.1 164.6 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 2600 2638 53 6.0 165.3 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 723 735 13 21.8 46.0 3.6X
+SQL Parquet MR: DataPageV1 2782 2807 36 5.7 176.9 0.9X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 3259 3266 11 4.8 207.2 0.8X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 279 288 7 56.4 17.7 9.3X
+SQL Parquet MR: DataPageV2 2699 2720 31 5.8 171.6 1.0X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 3174 3182 12 5.0 201.8 0.8X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 275 284 7 57.1 17.5 9.4X
================================================================================================
SQL Nested Column Scan
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
SQL Nested Column Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------
-SQL ORC MR 12768 12973 132 0.1 12176.7 1.0X
-SQL ORC Vectorized (Nested Column Disabled) 12932 13289 327 0.1 12333.3 1.0X
-SQL ORC Vectorized (Nested Column Enabled) 7205 7270 60 0.1 6870.8 1.8X
-SQL Parquet MR: DataPageV1 9028 9123 63 0.1 8609.9 1.4X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 9363 9406 38 0.1 8928.9 1.4X
-SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 5947 6003 50 0.2 5671.6 2.1X
-SQL Parquet MR: DataPageV2 9731 10064 276 0.1 9280.2 1.3X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 9999 10015 14 0.1 9535.5 1.3X
-SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 5554 5581 16 0.2 5297.1 2.3X
+SQL ORC MR 13352 13556 177 0.1 12733.3 1.0X
+SQL ORC Vectorized (Nested Column Disabled) 13179 13338 148 0.1 12568.6 1.0X
+SQL ORC Vectorized (Nested Column Enabled) 7419 7472 53 0.1 7075.5 1.8X
+SQL Parquet MR: DataPageV1 8783 8858 49 0.1 8375.8 1.5X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Disabled) 9105 9163 39 0.1 8683.3 1.5X
+SQL Parquet Vectorized: DataPageV1 (Nested Column Enabled) 5874 5929 36 0.2 5601.5 2.3X
+SQL Parquet MR: DataPageV2 9562 9661 78 0.1 9118.9 1.4X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Disabled) 9851 9891 24 0.1 9394.4 1.4X
+SQL Parquet Vectorized: DataPageV2 (Nested Column Enabled) 5640 5684 27 0.2 5379.0 2.4X
================================================================================================
Int and String Scan
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Int and String Scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 12435 12520 120 0.8 1185.9 1.0X
-SQL Json 10492 10539 67 1.0 1000.6 1.2X
-SQL Parquet Vectorized: DataPageV1 1788 1793 7 5.9 170.5 7.0X
-SQL Parquet Vectorized: DataPageV2 1918 1924 9 5.5 182.9 6.5X
-SQL Parquet MR: DataPageV1 4163 4169 8 2.5 397.0 3.0X
-SQL Parquet MR: DataPageV2 4092 4108 21 2.6 390.3 3.0X
-SQL ORC Vectorized 1843 1847 6 5.7 175.7 6.7X
-SQL ORC MR 3565 3573 11 2.9 340.0 3.5X
+SQL CSV 12583 12752 240 0.8 1200.0 1.0X
+SQL Json 10318 10364 64 1.0 984.0 1.2X
+SQL Parquet Vectorized: DataPageV1 1792 1802 15 5.9 170.9 7.0X
+SQL Parquet Vectorized: DataPageV2 1890 1897 10 5.5 180.3 6.7X
+SQL Parquet MR: DataPageV1 3919 3921 2 2.7 373.8 3.2X
+SQL Parquet MR: DataPageV2 3924 3945 30 2.7 374.2 3.2X
+SQL ORC Vectorized 1922 1928 9 5.5 183.3 6.5X
+SQL ORC MR 3550 3556 8 3.0 338.6 3.5X
================================================================================================
Repeated String Scan
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repeated String: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 7117 7146 41 1.5 678.8 1.0X
-SQL Json 6813 6814 1 1.5 649.7 1.0X
-SQL Parquet Vectorized: DataPageV1 487 492 5 21.5 46.4 14.6X
-SQL Parquet Vectorized: DataPageV2 492 502 12 21.3 46.9 14.5X
-SQL Parquet MR: DataPageV1 1659 1667 12 6.3 158.2 4.3X
-SQL Parquet MR: DataPageV2 1613 1621 11 6.5 153.8 4.4X
-SQL ORC Vectorized 398 409 13 26.3 38.0 17.9X
-SQL ORC MR 1857 1860 5 5.6 177.1 3.8X
+SQL CSV 7707 7781 104 1.4 735.0 1.0X
+SQL Json 6650 6655 7 1.6 634.2 1.2X
+SQL Parquet Vectorized: DataPageV1 511 524 18 20.5 48.7 15.1X
+SQL Parquet Vectorized: DataPageV2 513 521 14 20.5 48.9 15.0X
+SQL Parquet MR: DataPageV1 1628 1674 66 6.4 155.2 4.7X
+SQL Parquet MR: DataPageV2 1576 1580 7 6.7 150.3 4.9X
+SQL ORC Vectorized 408 411 2 25.7 38.9 18.9X
+SQL ORC MR 1683 1683 0 6.2 160.5 4.6X
================================================================================================
Partitioned Table Scan
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Partitioned Table: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-Data column - CSV 13634 13651 24 1.2 866.8 1.0X
-Data column - Json 10104 10109 7 1.6 642.4 1.3X
-Data column - Parquet Vectorized: DataPageV1 102 122 17 154.3 6.5 133.8X
-Data column - Parquet Vectorized: DataPageV2 236 252 17 66.8 15.0 57.9X
-Data column - Parquet MR: DataPageV1 2341 2361 28 6.7 148.9 5.8X
-Data column - Parquet MR: DataPageV2 2297 2311 20 6.8 146.0 5.9X
-Data column - ORC Vectorized 146 151 5 108.1 9.3 93.7X
-Data column - ORC MR 1848 1849 0 8.5 117.5 7.4X
-Partition column - CSV 3362 3435 103 4.7 213.8 4.1X
-Partition column - Json 8775 8801 37 1.8 557.9 1.6X
-Partition column - Parquet Vectorized: DataPageV1 31 34 3 512.8 2.0 444.5X
-Partition column - Parquet Vectorized: DataPageV2 30 34 4 522.3 1.9 452.8X
-Partition column - Parquet MR: DataPageV1 1205 1208 4 13.1 76.6 11.3X
-Partition column - Parquet MR: DataPageV2 1218 1240 31 12.9 77.4 11.2X
-Partition column - ORC Vectorized 29 32 3 549.4 1.8 476.3X
-Partition column - ORC MR 1255 1260 7 12.5 79.8 10.9X
-Both columns - CSV 13329 13349 28 1.2 847.4 1.0X
-Both columns - Json 10467 10476 13 1.5 665.5 1.3X
-Both columns - Parquet Vectorized: DataPageV1 121 140 14 129.6 7.7 112.4X
-Both columns - Parquet Vectorized: DataPageV2 250 275 17 63.0 15.9 54.6X
-Both columns - Parquet MR: DataPageV1 2295 2316 31 6.9 145.9 5.9X
-Both columns - Parquet MR: DataPageV2 2356 2378 30 6.7 149.8 5.8X
-Both columns - ORC Vectorized 178 187 16 88.5 11.3 76.7X
-Both columns - ORC MR 1893 1893 0 8.3 120.3 7.2X
+Data column - CSV 14303 14342 55 1.1 909.4 1.0X
+Data column - Json 9732 9830 139 1.6 618.8 1.5X
+Data column - Parquet Vectorized: DataPageV1 109 120 6 144.7 6.9 131.6X
+Data column - Parquet Vectorized: DataPageV2 264 275 8 59.7 16.8 54.3X
+Data column - Parquet MR: DataPageV1 2340 2346 9 6.7 148.8 6.1X
+Data column - Parquet MR: DataPageV2 2230 2238 11 7.1 141.8 6.4X
+Data column - ORC Vectorized 172 192 9 91.2 11.0 83.0X
+Data column - ORC MR 2021 2031 14 7.8 128.5 7.1X
+Partition column - CSV 3387 3413 36 4.6 215.4 4.2X
+Partition column - Json 8342 8348 9 1.9 530.4 1.7X
+Partition column - Parquet Vectorized: DataPageV1 33 36 3 470.0 2.1 427.4X
+Partition column - Parquet Vectorized: DataPageV2 34 37 4 466.6 2.1 424.3X
+Partition column - Parquet MR: DataPageV1 1204 1209 7 13.1 76.5 11.9X
+Partition column - Parquet MR: DataPageV2 1202 1210 11 13.1 76.4 11.9X
+Partition column - ORC Vectorized 36 38 3 438.3 2.3 398.6X
+Partition column - ORC MR 1348 1349 2 11.7 85.7 10.6X
+Both columns - CSV 14140 14184 62 1.1 899.0 1.0X
+Both columns - Json 10105 10120 21 1.6 642.4 1.4X
+Both columns - Parquet Vectorized: DataPageV1 140 155 17 112.2 8.9 102.0X
+Both columns - Parquet Vectorized: DataPageV2 302 330 21 52.1 19.2 47.4X
+Both columns - Parquet MR: DataPageV1 2385 2404 26 6.6 151.6 6.0X
+Both columns - Parquet MR: DataPageV2 2354 2374 28 6.7 149.6 6.1X
+Both columns - ORC Vectorized 208 244 21 75.5 13.2 68.7X
+Both columns - ORC MR 2162 2163 1 7.3 137.4 6.6X
================================================================================================
String with Nulls Scan
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String with Nulls Scan (0.0%): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 8636 8656 28 1.2 823.6 1.0X
-SQL Json 8982 9006 34 1.2 856.6 1.0X
-SQL Parquet Vectorized: DataPageV1 1302 1305 3 8.1 124.2 6.6X
-SQL Parquet Vectorized: DataPageV2 1342 1360 25 7.8 128.0 6.4X
-SQL Parquet MR: DataPageV1 3495 3511 22 3.0 333.3 2.5X
-SQL Parquet MR: DataPageV2 3660 3673 17 2.9 349.1 2.4X
-ParquetReader Vectorized: DataPageV1 859 862 3 12.2 81.9 10.1X
-ParquetReader Vectorized: DataPageV2 873 877 6 12.0 83.3 9.9X
-SQL ORC Vectorized 923 940 17 11.4 88.0 9.4X
-SQL ORC MR 2963 2966 4 3.5 282.6 2.9X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 9147 9239 130 1.1 872.4 1.0X
+SQL Json 9080 9083 4 1.2 865.9 1.0X
+SQL Parquet Vectorized: DataPageV1 1277 1299 31 8.2 121.8 7.2X
+SQL Parquet Vectorized: DataPageV2 1369 1387 26 7.7 130.6 6.7X
+SQL Parquet MR: DataPageV1 3487 3491 5 3.0 332.6 2.6X
+SQL Parquet MR: DataPageV2 3582 3583 2 2.9 341.6 2.6X
+ParquetReader Vectorized: DataPageV1 869 886 19 12.1 82.9 10.5X
+ParquetReader Vectorized: DataPageV2 899 903 4 11.7 85.7 10.2X
+SQL ORC Vectorized 971 988 15 10.8 92.6 9.4X
+SQL ORC MR 2933 2955 32 3.6 279.7 3.1X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String with Nulls Scan (50.0%): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 6432 6443 15 1.6 613.4 1.0X
-SQL Json 7575 7586 15 1.4 722.4 0.8X
-SQL Parquet Vectorized: DataPageV1 867 885 15 12.1 82.7 7.4X
-SQL Parquet Vectorized: DataPageV2 927 946 22 11.3 88.4 6.9X
-SQL Parquet MR: DataPageV1 2864 2868 5 3.7 273.1 2.2X
-SQL Parquet MR: DataPageV2 3055 3055 0 3.4 291.3 2.1X
-ParquetReader Vectorized: DataPageV1 755 767 11 13.9 72.0 8.5X
-ParquetReader Vectorized: DataPageV2 793 801 7 13.2 75.6 8.1X
-SQL ORC Vectorized 999 1001 4 10.5 95.2 6.4X
-SQL ORC MR 2740 2743 4 3.8 261.3 2.3X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 6715 6773 83 1.6 640.4 1.0X
+SQL Json 7526 7531 6 1.4 717.8 0.9X
+SQL Parquet Vectorized: DataPageV1 859 875 20 12.2 81.9 7.8X
+SQL Parquet Vectorized: DataPageV2 950 958 7 11.0 90.6 7.1X
+SQL Parquet MR: DataPageV1 2656 2668 18 3.9 253.3 2.5X
+SQL Parquet MR: DataPageV2 2819 2828 13 3.7 268.8 2.4X
+ParquetReader Vectorized: DataPageV1 760 780 19 13.8 72.5 8.8X
+ParquetReader Vectorized: DataPageV2 823 830 12 12.7 78.5 8.2X
+SQL ORC Vectorized 1040 1040 0 10.1 99.2 6.5X
+SQL ORC MR 2782 2791 13 3.8 265.3 2.4X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
String with Nulls Scan (95.0%): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 4835 4848 18 2.2 461.1 1.0X
-SQL Json 5469 5472 5 1.9 521.5 0.9X
-SQL Parquet Vectorized: DataPageV1 166 169 2 63.0 15.9 29.1X
-SQL Parquet Vectorized: DataPageV2 183 184 2 57.3 17.5 26.4X
-SQL Parquet MR: DataPageV1 1775 1785 14 5.9 169.3 2.7X
-SQL Parquet MR: DataPageV2 1800 1815 21 5.8 171.7 2.7X
-ParquetReader Vectorized: DataPageV1 169 173 2 62.2 16.1 28.7X
-ParquetReader Vectorized: DataPageV2 183 187 2 57.4 17.4 26.5X
-SQL ORC Vectorized 304 308 2 34.5 29.0 15.9X
-SQL ORC MR 1535 1541 9 6.8 146.4 3.2X
+SQL CSV 4498 4509 16 2.3 429.0 1.0X
+SQL Json 5349 5355 8 2.0 510.1 0.8X
+SQL Parquet Vectorized: DataPageV1 167 172 2 63.0 15.9 27.0X
+SQL Parquet Vectorized: DataPageV2 189 190 1 55.5 18.0 23.8X
+SQL Parquet MR: DataPageV1 1658 1675 24 6.3 158.1 2.7X
+SQL Parquet MR: DataPageV2 1613 1640 39 6.5 153.8 2.8X
+ParquetReader Vectorized: DataPageV1 172 173 1 61.0 16.4 26.1X
+ParquetReader Vectorized: DataPageV2 191 194 3 54.9 18.2 23.5X
+SQL ORC Vectorized 331 336 8 31.7 31.5 13.6X
+SQL ORC MR 1634 1642 11 6.4 155.8 2.8X
================================================================================================
Single Column Scan From Wide Columns
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Single Column Scan from 10 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 1202 1210 11 0.9 1146.3 1.0X
-SQL Json 1734 1735 1 0.6 1654.0 0.7X
-SQL Parquet Vectorized: DataPageV1 24 27 3 43.9 22.8 50.3X
-SQL Parquet Vectorized: DataPageV2 32 34 3 32.7 30.5 37.5X
-SQL Parquet MR: DataPageV1 156 160 4 6.7 149.0 7.7X
-SQL Parquet MR: DataPageV2 153 156 2 6.9 145.9 7.9X
-SQL ORC Vectorized 29 33 4 36.0 27.8 41.3X
-SQL ORC MR 123 129 6 8.5 117.2 9.8X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 1267 1279 17 0.8 1208.4 1.0X
+SQL Json 1757 1762 6 0.6 1676.0 0.7X
+SQL Parquet Vectorized: DataPageV1 25 29 4 41.5 24.1 50.2X
+SQL Parquet Vectorized: DataPageV2 34 38 4 30.9 32.3 37.4X
+SQL Parquet MR: DataPageV1 158 163 4 6.6 150.6 8.0X
+SQL Parquet MR: DataPageV2 154 158 4 6.8 146.5 8.3X
+SQL ORC Vectorized 30 32 4 35.1 28.5 42.4X
+SQL ORC MR 130 132 3 8.1 123.9 9.8X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Single Column Scan from 50 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 2618 2631 18 0.4 2497.0 1.0X
-SQL Json 6142 6146 6 0.2 5857.1 0.4X
-SQL Parquet Vectorized: DataPageV1 26 29 3 40.1 24.9 100.2X
-SQL Parquet Vectorized: DataPageV2 34 37 4 31.1 32.2 77.6X
-SQL Parquet MR: DataPageV1 161 165 5 6.5 153.4 16.3X
-SQL Parquet MR: DataPageV2 155 161 4 6.7 148.2 16.8X
-SQL ORC Vectorized 32 35 3 32.9 30.4 82.1X
-SQL ORC MR 125 129 3 8.4 119.5 20.9X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+SQL CSV 2691 2740 70 0.4 2566.3 1.0X
+SQL Json 6037 6057 29 0.2 5757.4 0.4X
+SQL Parquet Vectorized: DataPageV1 28 30 3 38.0 26.3 97.5X
+SQL Parquet Vectorized: DataPageV2 37 40 4 28.3 35.3 72.6X
+SQL Parquet MR: DataPageV1 163 167 3 6.4 155.9 16.5X
+SQL Parquet MR: DataPageV2 158 163 6 6.6 150.7 17.0X
+SQL ORC Vectorized 34 37 3 31.3 32.0 80.3X
+SQL ORC MR 133 136 2 7.9 127.2 20.2X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Single Column Scan from 100 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-SQL CSV 4450 4453 4 0.2 4244.0 1.0X
-SQL Json 11304 11358 77 0.1 10780.6 0.4X
-SQL Parquet Vectorized: DataPageV1 34 37 4 30.9 32.4 131.2X
-SQL Parquet Vectorized: DataPageV2 41 46 6 25.6 39.1 108.5X
-SQL Parquet MR: DataPageV1 169 177 6 6.2 160.7 26.4X
-SQL Parquet MR: DataPageV2 168 172 3 6.3 159.7 26.6X
-SQL ORC Vectorized 37 41 7 28.2 35.5 119.6X
-SQL ORC MR 129 135 4 8.1 123.1 34.5X
+SQL CSV 4417 4431 19 0.2 4212.5 1.0X
+SQL Json 11107 11201 134 0.1 10592.1 0.4X
+SQL Parquet Vectorized: DataPageV1 36 40 5 29.3 34.1 123.5X
+SQL Parquet Vectorized: DataPageV2 45 49 5 23.5 42.5 99.1X
+SQL Parquet MR: DataPageV1 176 180 2 5.9 168.1 25.1X
+SQL Parquet MR: DataPageV2 172 175 3 6.1 163.6 25.7X
+SQL ORC Vectorized 43 47 5 24.6 40.7 103.6X
+SQL ORC MR 146 149 3 7.2 139.3 30.2X
diff --git a/sql/core/benchmarks/DatasetBenchmark-jdk21-results.txt b/sql/core/benchmarks/DatasetBenchmark-jdk21-results.txt
index 6f45a55c40ec6..051577fa4a9f0 100644
--- a/sql/core/benchmarks/DatasetBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/DatasetBenchmark-jdk21-results.txt
@@ -2,45 +2,45 @@
Dataset Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back map long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 6520 6520 1 15.3 65.2 1.0X
-DataFrame 1192 1241 68 83.9 11.9 5.5X
-Dataset 1640 1705 92 61.0 16.4 4.0X
+RDD 6456 6516 85 15.5 64.6 1.0X
+DataFrame 1215 1262 67 82.3 12.1 5.3X
+Dataset 1722 1726 6 58.1 17.2 3.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back map: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 7453 7459 9 13.4 74.5 1.0X
-DataFrame 2922 2940 25 34.2 29.2 2.6X
-Dataset 7021 7024 4 14.2 70.2 1.1X
+RDD 7533 7547 20 13.3 75.3 1.0X
+DataFrame 2802 2841 55 35.7 28.0 2.7X
+Dataset 7391 7397 8 13.5 73.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back filter Long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 4428 4492 90 22.6 44.3 1.0X
-DataFrame 728 736 10 137.5 7.3 6.1X
-Dataset 1638 1654 23 61.1 16.4 2.7X
+RDD 4352 4379 38 23.0 43.5 1.0X
+DataFrame 714 730 20 140.1 7.1 6.1X
+Dataset 2404 2407 4 41.6 24.0 1.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back filter: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 2086 2095 12 47.9 20.9 1.0X
-DataFrame 110 122 10 912.5 1.1 19.0X
-Dataset 2367 2398 45 42.3 23.7 0.9X
+RDD 2082 2116 47 48.0 20.8 1.0X
+DataFrame 112 125 16 896.6 1.1 18.7X
+Dataset 2342 2375 46 42.7 23.4 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
aggregate: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD sum 1404 1408 5 71.2 14.0 1.0X
-DataFrame sum 57 70 10 1767.9 0.6 24.8X
-Dataset sum using Aggregator 1944 2023 111 51.4 19.4 0.7X
-Dataset complex Aggregator 4838 4881 60 20.7 48.4 0.3X
+RDD sum 1402 1412 14 71.3 14.0 1.0X
+DataFrame sum 68 83 11 1470.1 0.7 20.6X
+Dataset sum using Aggregator 1946 2009 89 51.4 19.5 0.7X
+Dataset complex Aggregator 5018 5103 119 19.9 50.2 0.3X
diff --git a/sql/core/benchmarks/DatasetBenchmark-results.txt b/sql/core/benchmarks/DatasetBenchmark-results.txt
index 856b2302069a0..5cdca4d5041b2 100644
--- a/sql/core/benchmarks/DatasetBenchmark-results.txt
+++ b/sql/core/benchmarks/DatasetBenchmark-results.txt
@@ -2,45 +2,45 @@
Dataset Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back map long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 5879 6176 420 17.0 58.8 1.0X
-DataFrame 1159 1189 43 86.3 11.6 5.1X
-Dataset 1617 1667 70 61.8 16.2 3.6X
+RDD 5736 5828 129 17.4 57.4 1.0X
+DataFrame 1164 1168 6 85.9 11.6 4.9X
+Dataset 1604 1701 137 62.4 16.0 3.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back map: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 6934 6965 44 14.4 69.3 1.0X
-DataFrame 2836 2893 82 35.3 28.4 2.4X
-Dataset 6597 6669 102 15.2 66.0 1.1X
+RDD 6867 6977 155 14.6 68.7 1.0X
+DataFrame 2745 2782 52 36.4 27.5 2.5X
+Dataset 6475 6615 198 15.4 64.7 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back filter Long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 4186 4227 57 23.9 41.9 1.0X
-DataFrame 671 703 53 148.9 6.7 6.2X
-Dataset 1598 1599 1 62.6 16.0 2.6X
+RDD 4072 4132 84 24.6 40.7 1.0X
+DataFrame 683 696 12 146.4 6.8 6.0X
+Dataset 1724 1763 55 58.0 17.2 2.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
back-to-back filter: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD 2083 2087 6 48.0 20.8 1.0X
-DataFrame 111 124 11 903.6 1.1 18.8X
-Dataset 2453 2498 65 40.8 24.5 0.8X
+RDD 2035 2090 78 49.1 20.3 1.0X
+DataFrame 108 120 11 927.7 1.1 18.9X
+Dataset 2467 2477 14 40.5 24.7 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
aggregate: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-RDD sum 1412 1427 20 70.8 14.1 1.0X
-DataFrame sum 69 81 9 1447.3 0.7 20.4X
-Dataset sum using Aggregator 2107 2148 58 47.5 21.1 0.7X
-Dataset complex Aggregator 4949 5079 183 20.2 49.5 0.3X
+RDD sum 1402 1422 29 71.3 14.0 1.0X
+DataFrame sum 67 78 9 1499.3 0.7 21.0X
+Dataset sum using Aggregator 2099 2104 7 47.6 21.0 0.7X
+Dataset complex Aggregator 4956 5026 99 20.2 49.6 0.3X
diff --git a/sql/core/benchmarks/DateTimeBenchmark-jdk21-results.txt b/sql/core/benchmarks/DateTimeBenchmark-jdk21-results.txt
index be96ecb63d510..09f3b3dbba4c6 100644
--- a/sql/core/benchmarks/DateTimeBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/DateTimeBenchmark-jdk21-results.txt
@@ -2,460 +2,460 @@
datetime +/- interval
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
datetime +/- interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date + interval(m) 910 932 21 11.0 91.0 1.0X
-date + interval(m, d) 899 900 1 11.1 89.9 1.0X
-date + interval(m, d, ms) 3476 3482 8 2.9 347.6 0.3X
-date - interval(m) 826 830 4 12.1 82.6 1.1X
-date - interval(m, d) 886 888 2 11.3 88.6 1.0X
-date - interval(m, d, ms) 3498 3504 9 2.9 349.8 0.3X
-timestamp + interval(m) 1827 1831 6 5.5 182.7 0.5X
-timestamp + interval(m, d) 1902 1905 3 5.3 190.2 0.5X
-timestamp + interval(m, d, ms) 1749 1750 1 5.7 174.9 0.5X
-timestamp - interval(m) 1494 1496 2 6.7 149.4 0.6X
-timestamp - interval(m, d) 1579 1580 2 6.3 157.9 0.6X
-timestamp - interval(m, d, ms) 1737 1740 5 5.8 173.7 0.5X
+date + interval(m) 886 903 16 11.3 88.6 1.0X
+date + interval(m, d) 860 869 8 11.6 86.0 1.0X
+date + interval(m, d, ms) 3589 3600 16 2.8 358.9 0.2X
+date - interval(m) 835 837 2 12.0 83.5 1.1X
+date - interval(m, d) 896 900 5 11.2 89.6 1.0X
+date - interval(m, d, ms) 3614 3618 6 2.8 361.4 0.2X
+timestamp + interval(m) 1867 1883 23 5.4 186.7 0.5X
+timestamp + interval(m, d) 1922 1923 1 5.2 192.2 0.5X
+timestamp + interval(m, d, ms) 1711 1712 1 5.8 171.1 0.5X
+timestamp - interval(m) 1515 1516 2 6.6 151.5 0.6X
+timestamp - interval(m, d) 1561 1562 1 6.4 156.1 0.6X
+timestamp - interval(m, d, ms) 1704 1708 6 5.9 170.4 0.5X
================================================================================================
Extract components
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast to timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to timestamp wholestage off 200 204 5 50.0 20.0 1.0X
-cast to timestamp wholestage on 208 214 4 48.2 20.8 1.0X
+cast to timestamp wholestage off 198 203 7 50.6 19.8 1.0X
+cast to timestamp wholestage on 213 218 3 46.9 21.3 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
year of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-year of timestamp wholestage off 641 645 6 15.6 64.1 1.0X
-year of timestamp wholestage on 630 635 7 15.9 63.0 1.0X
+year of timestamp wholestage off 628 630 3 15.9 62.8 1.0X
+year of timestamp wholestage on 633 639 8 15.8 63.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
quarter of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-quarter of timestamp wholestage off 674 677 5 14.8 67.4 1.0X
-quarter of timestamp wholestage on 673 676 2 14.9 67.3 1.0X
+quarter of timestamp wholestage off 673 674 1 14.9 67.3 1.0X
+quarter of timestamp wholestage on 669 675 6 14.9 66.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
month of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-month of timestamp wholestage off 650 655 8 15.4 65.0 1.0X
-month of timestamp wholestage on 637 641 4 15.7 63.7 1.0X
+month of timestamp wholestage off 647 648 1 15.5 64.7 1.0X
+month of timestamp wholestage on 646 650 3 15.5 64.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
weekofyear of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-weekofyear of timestamp wholestage off 1006 1012 8 9.9 100.6 1.0X
-weekofyear of timestamp wholestage on 1054 1057 3 9.5 105.4 1.0X
+weekofyear of timestamp wholestage off 1037 1039 2 9.6 103.7 1.0X
+weekofyear of timestamp wholestage on 1120 1124 4 8.9 112.0 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
day of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-day of timestamp wholestage off 660 661 0 15.1 66.0 1.0X
-day of timestamp wholestage on 637 643 5 15.7 63.7 1.0X
+day of timestamp wholestage off 658 658 1 15.2 65.8 1.0X
+day of timestamp wholestage on 661 666 7 15.1 66.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dayofyear of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-dayofyear of timestamp wholestage off 697 699 3 14.4 69.7 1.0X
-dayofyear of timestamp wholestage on 689 693 3 14.5 68.9 1.0X
+dayofyear of timestamp wholestage off 679 680 3 14.7 67.9 1.0X
+dayofyear of timestamp wholestage on 683 693 12 14.6 68.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dayofmonth of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-dayofmonth of timestamp wholestage off 684 687 5 14.6 68.4 1.0X
-dayofmonth of timestamp wholestage on 640 643 3 15.6 64.0 1.1X
+dayofmonth of timestamp wholestage off 673 678 7 14.9 67.3 1.0X
+dayofmonth of timestamp wholestage on 655 658 4 15.3 65.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dayofweek of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-dayofweek of timestamp wholestage off 820 826 8 12.2 82.0 1.0X
-dayofweek of timestamp wholestage on 810 816 4 12.3 81.0 1.0X
+dayofweek of timestamp wholestage off 804 808 6 12.4 80.4 1.0X
+dayofweek of timestamp wholestage on 813 818 5 12.3 81.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
weekday of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-weekday of timestamp wholestage off 765 766 1 13.1 76.5 1.0X
-weekday of timestamp wholestage on 741 745 4 13.5 74.1 1.0X
+weekday of timestamp wholestage off 739 740 2 13.5 73.9 1.0X
+weekday of timestamp wholestage on 749 752 4 13.4 74.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
hour of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-hour of timestamp wholestage off 555 556 1 18.0 55.5 1.0X
-hour of timestamp wholestage on 573 576 4 17.5 57.3 1.0X
+hour of timestamp wholestage off 543 544 2 18.4 54.3 1.0X
+hour of timestamp wholestage on 558 570 22 17.9 55.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
minute of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-minute of timestamp wholestage off 559 559 1 17.9 55.9 1.0X
-minute of timestamp wholestage on 551 554 4 18.1 55.1 1.0X
+minute of timestamp wholestage off 544 546 3 18.4 54.4 1.0X
+minute of timestamp wholestage on 561 563 2 17.8 56.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
second of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-second of timestamp wholestage off 556 558 3 18.0 55.6 1.0X
-second of timestamp wholestage on 552 556 3 18.1 55.2 1.0X
+second of timestamp wholestage off 544 566 31 18.4 54.4 1.0X
+second of timestamp wholestage on 561 563 2 17.8 56.1 1.0X
================================================================================================
Current date and time
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
current_date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-current_date wholestage off 196 197 3 51.1 19.6 1.0X
-current_date wholestage on 208 211 4 48.1 20.8 0.9X
+current_date wholestage off 176 176 1 56.8 17.6 1.0X
+current_date wholestage on 215 219 4 46.5 21.5 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
current_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-current_timestamp wholestage off 188 190 2 53.1 18.8 1.0X
-current_timestamp wholestage on 218 237 28 45.9 21.8 0.9X
+current_timestamp wholestage off 182 186 5 54.9 18.2 1.0X
+current_timestamp wholestage on 230 242 14 43.5 23.0 0.8X
================================================================================================
Date arithmetic
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast to date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to date wholestage off 619 626 10 16.2 61.9 1.0X
-cast to date wholestage on 621 626 5 16.1 62.1 1.0X
+cast to date wholestage off 614 615 1 16.3 61.4 1.0X
+cast to date wholestage on 633 637 2 15.8 63.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
last_day: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-last_day wholestage off 684 685 2 14.6 68.4 1.0X
-last_day wholestage on 664 670 4 15.0 66.4 1.0X
+last_day wholestage off 673 674 2 14.9 67.3 1.0X
+last_day wholestage on 682 687 6 14.7 68.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
next_day: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-next_day wholestage off 653 656 5 15.3 65.3 1.0X
-next_day wholestage on 651 654 4 15.4 65.1 1.0X
+next_day wholestage off 637 647 15 15.7 63.7 1.0X
+next_day wholestage on 664 666 1 15.1 66.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_add: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_add wholestage off 590 592 2 16.9 59.0 1.0X
-date_add wholestage on 587 591 4 17.0 58.7 1.0X
+date_add wholestage off 590 591 2 17.0 59.0 1.0X
+date_add wholestage on 593 595 2 16.9 59.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_sub: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_sub wholestage off 599 599 1 16.7 59.9 1.0X
-date_sub wholestage on 588 590 1 17.0 58.8 1.0X
+date_sub wholestage off 585 587 3 17.1 58.5 1.0X
+date_sub wholestage on 590 595 5 16.9 59.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
add_months: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-add_months wholestage off 836 840 6 12.0 83.6 1.0X
-add_months wholestage on 812 815 4 12.3 81.2 1.0X
+add_months wholestage off 812 815 4 12.3 81.2 1.0X
+add_months wholestage on 823 824 1 12.1 82.3 1.0X
================================================================================================
Formatting dates
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
format date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-format date wholestage off 3197 3201 6 3.1 319.7 1.0X
-format date wholestage on 3169 3195 18 3.2 316.9 1.0X
+format date wholestage off 3196 3208 17 3.1 319.6 1.0X
+format date wholestage on 3256 3281 45 3.1 325.6 1.0X
================================================================================================
Formatting timestamps
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_unixtime: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-from_unixtime wholestage off 2512 2522 14 4.0 251.2 1.0X
-from_unixtime wholestage on 2577 2590 8 3.9 257.7 1.0X
+from_unixtime wholestage off 2538 2542 6 3.9 253.8 1.0X
+from_unixtime wholestage on 2543 2559 16 3.9 254.3 1.0X
================================================================================================
Convert timestamps
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_utc_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-from_utc_timestamp wholestage off 673 674 1 14.9 67.3 1.0X
-from_utc_timestamp wholestage on 779 785 5 12.8 77.9 0.9X
+from_utc_timestamp wholestage off 704 705 2 14.2 70.4 1.0X
+from_utc_timestamp wholestage on 776 777 1 12.9 77.6 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_utc_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_utc_timestamp wholestage off 794 795 0 12.6 79.4 1.0X
-to_utc_timestamp wholestage on 837 843 7 12.0 83.7 0.9X
+to_utc_timestamp wholestage off 774 774 1 12.9 77.4 1.0X
+to_utc_timestamp wholestage on 827 830 3 12.1 82.7 0.9X
================================================================================================
Intervals
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast interval wholestage off 226 227 1 44.3 22.6 1.0X
-cast interval wholestage on 217 218 3 46.2 21.7 1.0X
+cast interval wholestage off 228 234 9 43.9 22.8 1.0X
+cast interval wholestage on 218 220 3 45.8 21.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
datediff: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-datediff wholestage off 996 1000 6 10.0 99.6 1.0X
-datediff wholestage on 1042 1046 6 9.6 104.2 1.0X
+datediff wholestage off 984 984 0 10.2 98.4 1.0X
+datediff wholestage on 1038 1039 1 9.6 103.8 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
months_between: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-months_between wholestage off 3012 3021 14 3.3 301.2 1.0X
-months_between wholestage on 3080 3088 12 3.2 308.0 1.0X
+months_between wholestage off 3204 3208 6 3.1 320.4 1.0X
+months_between wholestage on 3175 3182 7 3.1 317.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
window: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-window wholestage off 409 416 10 2.4 408.5 1.0X
-window wholestage on 654 692 24 1.5 654.2 0.6X
+window wholestage off 401 408 10 2.5 400.6 1.0X
+window wholestage on 613 642 18 1.6 612.9 0.7X
================================================================================================
Truncation
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc YEAR: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc YEAR wholestage off 1544 1545 0 6.5 154.4 1.0X
-date_trunc YEAR wholestage on 1535 1539 4 6.5 153.5 1.0X
+date_trunc YEAR wholestage off 1674 1677 4 6.0 167.4 1.0X
+date_trunc YEAR wholestage on 1643 1646 3 6.1 164.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc YYYY: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc YYYY wholestage off 1541 1547 9 6.5 154.1 1.0X
-date_trunc YYYY wholestage on 1534 1536 2 6.5 153.4 1.0X
+date_trunc YYYY wholestage off 1675 1676 3 6.0 167.5 1.0X
+date_trunc YYYY wholestage on 1642 1646 4 6.1 164.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc YY: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc YY wholestage off 1544 1545 0 6.5 154.4 1.0X
-date_trunc YY wholestage on 1534 1540 6 6.5 153.4 1.0X
+date_trunc YY wholestage off 1677 1677 1 6.0 167.7 1.0X
+date_trunc YY wholestage on 1642 1645 4 6.1 164.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MON: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MON wholestage off 1592 1593 1 6.3 159.2 1.0X
-date_trunc MON wholestage on 1805 1816 9 5.5 180.5 0.9X
+date_trunc MON wholestage off 1700 1701 1 5.9 170.0 1.0X
+date_trunc MON wholestage on 1634 1636 2 6.1 163.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MONTH: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MONTH wholestage off 1591 1592 2 6.3 159.1 1.0X
-date_trunc MONTH wholestage on 1805 1813 7 5.5 180.5 0.9X
+date_trunc MONTH wholestage off 1705 1706 2 5.9 170.5 1.0X
+date_trunc MONTH wholestage on 1633 1636 3 6.1 163.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MM: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MM wholestage off 1587 1587 1 6.3 158.7 1.0X
-date_trunc MM wholestage on 1804 1812 5 5.5 180.4 0.9X
+date_trunc MM wholestage off 1702 1703 2 5.9 170.2 1.0X
+date_trunc MM wholestage on 1634 1636 3 6.1 163.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc DAY: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc DAY wholestage off 1178 1179 1 8.5 117.8 1.0X
-date_trunc DAY wholestage on 1157 1160 2 8.6 115.7 1.0X
+date_trunc DAY wholestage off 1160 1162 3 8.6 116.0 1.0X
+date_trunc DAY wholestage on 1157 1159 1 8.6 115.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc DD: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc DD wholestage off 1183 1198 21 8.5 118.3 1.0X
-date_trunc DD wholestage on 1157 1167 19 8.6 115.7 1.0X
+date_trunc DD wholestage off 1187 1195 11 8.4 118.7 1.0X
+date_trunc DD wholestage on 1150 1153 3 8.7 115.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc HOUR: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc HOUR wholestage off 1216 1223 9 8.2 121.6 1.0X
-date_trunc HOUR wholestage on 1236 1239 2 8.1 123.6 1.0X
+date_trunc HOUR wholestage off 1213 1215 3 8.2 121.3 1.0X
+date_trunc HOUR wholestage on 1230 1232 3 8.1 123.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MINUTE: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MINUTE wholestage off 1201 1202 1 8.3 120.1 1.0X
-date_trunc MINUTE wholestage on 1172 1174 2 8.5 117.2 1.0X
+date_trunc MINUTE wholestage off 1196 1197 2 8.4 119.6 1.0X
+date_trunc MINUTE wholestage on 1190 1192 2 8.4 119.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc SECOND: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc SECOND wholestage off 307 313 8 32.5 30.7 1.0X
-date_trunc SECOND wholestage on 288 293 5 34.7 28.8 1.1X
+date_trunc SECOND wholestage off 290 294 5 34.4 29.0 1.0X
+date_trunc SECOND wholestage on 264 268 4 37.8 26.4 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc WEEK: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc WEEK wholestage off 1484 1486 4 6.7 148.4 1.0X
-date_trunc WEEK wholestage on 1458 1462 4 6.9 145.8 1.0X
+date_trunc WEEK wholestage off 1677 1679 2 6.0 167.7 1.0X
+date_trunc WEEK wholestage on 1548 1550 2 6.5 154.8 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc QUARTER: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc QUARTER wholestage off 1859 1860 1 5.4 185.9 1.0X
-date_trunc QUARTER wholestage on 1892 1897 4 5.3 189.2 1.0X
+date_trunc QUARTER wholestage off 2013 2019 9 5.0 201.3 1.0X
+date_trunc QUARTER wholestage on 1933 1935 3 5.2 193.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc year: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc year wholestage off 804 805 1 12.4 80.4 1.0X
-trunc year wholestage on 780 785 5 12.8 78.0 1.0X
+trunc year wholestage off 792 793 1 12.6 79.2 1.0X
+trunc year wholestage on 765 770 3 13.1 76.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc yyyy: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc yyyy wholestage off 800 800 1 12.5 80.0 1.0X
-trunc yyyy wholestage on 779 782 2 12.8 77.9 1.0X
+trunc yyyy wholestage off 793 793 1 12.6 79.3 1.0X
+trunc yyyy wholestage on 762 765 2 13.1 76.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc yy: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc yy wholestage off 800 802 2 12.5 80.0 1.0X
-trunc yy wholestage on 780 782 2 12.8 78.0 1.0X
+trunc yy wholestage off 793 793 1 12.6 79.3 1.0X
+trunc yy wholestage on 763 765 2 13.1 76.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc mon: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc mon wholestage off 771 771 0 13.0 77.1 1.0X
-trunc mon wholestage on 752 756 3 13.3 75.2 1.0X
+trunc mon wholestage off 747 749 2 13.4 74.7 1.0X
+trunc mon wholestage on 731 733 2 13.7 73.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc month: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc month wholestage off 768 769 2 13.0 76.8 1.0X
-trunc month wholestage on 754 757 4 13.3 75.4 1.0X
+trunc month wholestage off 748 748 0 13.4 74.8 1.0X
+trunc month wholestage on 731 732 1 13.7 73.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc mm: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc mm wholestage off 768 770 3 13.0 76.8 1.0X
-trunc mm wholestage on 757 767 10 13.2 75.7 1.0X
+trunc mm wholestage off 749 749 1 13.4 74.9 1.0X
+trunc mm wholestage on 731 736 3 13.7 73.1 1.0X
================================================================================================
Parsing
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to timestamp str: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to timestamp str wholestage off 106 106 0 9.5 105.7 1.0X
-to timestamp str wholestage on 100 103 4 10.0 100.3 1.1X
+to timestamp str wholestage off 104 106 2 9.6 104.2 1.0X
+to timestamp str wholestage on 97 100 3 10.3 97.4 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_timestamp wholestage off 663 670 9 1.5 663.0 1.0X
-to_timestamp wholestage on 665 666 1 1.5 665.0 1.0X
+to_timestamp wholestage off 667 677 14 1.5 667.3 1.0X
+to_timestamp wholestage on 666 668 1 1.5 666.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_unix_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_unix_timestamp wholestage off 673 680 10 1.5 672.7 1.0X
-to_unix_timestamp wholestage on 675 676 1 1.5 674.7 1.0X
+to_unix_timestamp wholestage off 678 680 2 1.5 678.4 1.0X
+to_unix_timestamp wholestage on 667 669 3 1.5 666.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to date str: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to date str wholestage off 134 135 1 7.5 133.6 1.0X
-to date str wholestage on 133 135 2 7.5 132.7 1.0X
+to date str wholestage off 137 138 2 7.3 136.5 1.0X
+to date str wholestage on 129 131 2 7.8 128.9 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_date wholestage off 650 652 2 1.5 650.3 1.0X
-to_date wholestage on 643 647 4 1.6 642.9 1.0X
+to_date wholestage off 693 694 1 1.4 693.3 1.0X
+to_date wholestage on 690 693 2 1.4 690.1 1.0X
================================================================================================
Conversion from/to external types
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
To/from Java's date-time: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-From java.sql.Date 290 292 2 17.3 57.9 1.0X
-From java.time.LocalDate 231 233 2 21.7 46.2 1.3X
-Collect java.sql.Date 1074 1256 160 4.7 214.7 0.3X
-Collect java.time.LocalDate 907 988 138 5.5 181.4 0.3X
-From java.sql.Timestamp 253 256 4 19.7 50.7 1.1X
-From java.time.Instant 204 216 12 24.6 40.7 1.4X
-Collect longs 802 980 168 6.2 160.3 0.4X
-Collect java.sql.Timestamp 1147 1173 32 4.4 229.5 0.3X
-Collect java.time.Instant 1064 1093 46 4.7 212.8 0.3X
-java.sql.Date to Hive string 4131 4176 54 1.2 826.2 0.1X
-java.time.LocalDate to Hive string 3118 3176 57 1.6 623.5 0.1X
-java.sql.Timestamp to Hive string 6324 6506 159 0.8 1264.8 0.0X
-java.time.Instant to Hive string 4122 4159 33 1.2 824.3 0.1X
+From java.sql.Date 270 271 1 18.5 54.0 1.0X
+From java.time.LocalDate 222 223 0 22.5 44.5 1.2X
+Collect java.sql.Date 1212 1267 83 4.1 242.3 0.2X
+Collect java.time.LocalDate 848 981 212 5.9 169.6 0.3X
+From java.sql.Timestamp 201 202 1 24.8 40.3 1.3X
+From java.time.Instant 172 174 2 29.1 34.4 1.6X
+Collect longs 900 1019 150 5.6 179.9 0.3X
+Collect java.sql.Timestamp 1137 1235 91 4.4 227.4 0.2X
+Collect java.time.Instant 799 1074 285 6.3 159.9 0.3X
+java.sql.Date to Hive string 4066 4209 128 1.2 813.2 0.1X
+java.time.LocalDate to Hive string 3288 3408 146 1.5 657.6 0.1X
+java.sql.Timestamp to Hive string 6486 6588 90 0.8 1297.2 0.0X
+java.time.Instant to Hive string 4388 4434 74 1.1 877.5 0.1X
diff --git a/sql/core/benchmarks/DateTimeBenchmark-results.txt b/sql/core/benchmarks/DateTimeBenchmark-results.txt
index dcb4e3c45e26a..34bd57334d646 100644
--- a/sql/core/benchmarks/DateTimeBenchmark-results.txt
+++ b/sql/core/benchmarks/DateTimeBenchmark-results.txt
@@ -2,460 +2,460 @@
datetime +/- interval
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
datetime +/- interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date + interval(m) 1015 1028 19 9.9 101.5 1.0X
-date + interval(m, d) 988 993 7 10.1 98.8 1.0X
-date + interval(m, d, ms) 3626 3649 32 2.8 362.6 0.3X
-date - interval(m) 981 993 15 10.2 98.1 1.0X
-date - interval(m, d) 1009 1020 17 9.9 100.9 1.0X
-date - interval(m, d, ms) 3654 3658 6 2.7 365.4 0.3X
-timestamp + interval(m) 1782 1786 6 5.6 178.2 0.6X
-timestamp + interval(m, d) 1826 1835 13 5.5 182.6 0.6X
-timestamp + interval(m, d, ms) 1970 1971 2 5.1 197.0 0.5X
-timestamp - interval(m) 1717 1731 19 5.8 171.7 0.6X
-timestamp - interval(m, d) 1791 1793 3 5.6 179.1 0.6X
-timestamp - interval(m, d, ms) 1962 1965 4 5.1 196.2 0.5X
+date + interval(m) 976 985 8 10.2 97.6 1.0X
+date + interval(m, d) 995 1005 10 10.1 99.5 1.0X
+date + interval(m, d, ms) 3730 3736 8 2.7 373.0 0.3X
+date - interval(m) 966 970 4 10.4 96.6 1.0X
+date - interval(m, d) 978 994 26 10.2 97.8 1.0X
+date - interval(m, d, ms) 3761 3773 17 2.7 376.1 0.3X
+timestamp + interval(m) 1897 1919 30 5.3 189.7 0.5X
+timestamp + interval(m, d) 1952 1954 4 5.1 195.2 0.5X
+timestamp + interval(m, d, ms) 2181 2182 3 4.6 218.1 0.4X
+timestamp - interval(m) 1946 1946 1 5.1 194.6 0.5X
+timestamp - interval(m, d) 2018 2022 5 5.0 201.8 0.5X
+timestamp - interval(m, d, ms) 2181 2185 6 4.6 218.1 0.4X
================================================================================================
Extract components
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast to timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to timestamp wholestage off 193 198 6 51.7 19.3 1.0X
-cast to timestamp wholestage on 209 217 9 47.8 20.9 0.9X
+cast to timestamp wholestage off 195 198 4 51.3 19.5 1.0X
+cast to timestamp wholestage on 208 215 7 48.0 20.8 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
year of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-year of timestamp wholestage off 775 778 5 12.9 77.5 1.0X
-year of timestamp wholestage on 772 777 5 13.0 77.2 1.0X
+year of timestamp wholestage off 775 783 11 12.9 77.5 1.0X
+year of timestamp wholestage on 775 780 5 12.9 77.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
quarter of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-quarter of timestamp wholestage off 791 793 2 12.6 79.1 1.0X
-quarter of timestamp wholestage on 782 788 7 12.8 78.2 1.0X
+quarter of timestamp wholestage off 793 794 2 12.6 79.3 1.0X
+quarter of timestamp wholestage on 803 807 5 12.5 80.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
month of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-month of timestamp wholestage off 769 770 1 13.0 76.9 1.0X
-month of timestamp wholestage on 771 775 3 13.0 77.1 1.0X
+month of timestamp wholestage off 771 773 3 13.0 77.1 1.0X
+month of timestamp wholestage on 780 784 3 12.8 78.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
weekofyear of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-weekofyear of timestamp wholestage off 1029 1032 5 9.7 102.9 1.0X
-weekofyear of timestamp wholestage on 1207 1210 4 8.3 120.7 0.9X
+weekofyear of timestamp wholestage off 1135 1141 8 8.8 113.5 1.0X
+weekofyear of timestamp wholestage on 1240 1242 1 8.1 124.0 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
day of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-day of timestamp wholestage off 780 782 2 12.8 78.0 1.0X
-day of timestamp wholestage on 779 786 11 12.8 77.9 1.0X
+day of timestamp wholestage off 766 775 13 13.1 76.6 1.0X
+day of timestamp wholestage on 778 790 16 12.8 77.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dayofyear of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-dayofyear of timestamp wholestage off 805 807 2 12.4 80.5 1.0X
-dayofyear of timestamp wholestage on 816 820 3 12.3 81.6 1.0X
+dayofyear of timestamp wholestage off 806 807 2 12.4 80.6 1.0X
+dayofyear of timestamp wholestage on 819 823 6 12.2 81.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dayofmonth of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-dayofmonth of timestamp wholestage off 781 783 3 12.8 78.1 1.0X
-dayofmonth of timestamp wholestage on 773 777 3 12.9 77.3 1.0X
+dayofmonth of timestamp wholestage off 780 786 8 12.8 78.0 1.0X
+dayofmonth of timestamp wholestage on 782 787 7 12.8 78.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dayofweek of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-dayofweek of timestamp wholestage off 929 930 2 10.8 92.9 1.0X
-dayofweek of timestamp wholestage on 912 917 5 11.0 91.2 1.0X
+dayofweek of timestamp wholestage off 914 916 2 10.9 91.4 1.0X
+dayofweek of timestamp wholestage on 924 930 7 10.8 92.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
weekday of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-weekday of timestamp wholestage off 896 896 0 11.2 89.6 1.0X
-weekday of timestamp wholestage on 871 871 1 11.5 87.1 1.0X
+weekday of timestamp wholestage off 877 880 5 11.4 87.7 1.0X
+weekday of timestamp wholestage on 892 894 3 11.2 89.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
hour of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-hour of timestamp wholestage off 611 611 0 16.4 61.1 1.0X
-hour of timestamp wholestage on 607 614 5 16.5 60.7 1.0X
+hour of timestamp wholestage off 605 607 2 16.5 60.5 1.0X
+hour of timestamp wholestage on 625 627 2 16.0 62.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
minute of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-minute of timestamp wholestage off 606 607 1 16.5 60.6 1.0X
-minute of timestamp wholestage on 606 615 10 16.5 60.6 1.0X
+minute of timestamp wholestage off 604 606 2 16.6 60.4 1.0X
+minute of timestamp wholestage on 625 631 11 16.0 62.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
second of timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-second of timestamp wholestage off 604 605 2 16.6 60.4 1.0X
-second of timestamp wholestage on 612 616 4 16.3 61.2 1.0X
+second of timestamp wholestage off 605 608 4 16.5 60.5 1.0X
+second of timestamp wholestage on 624 627 3 16.0 62.4 1.0X
================================================================================================
Current date and time
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
current_date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-current_date wholestage off 182 184 2 54.9 18.2 1.0X
-current_date wholestage on 208 215 7 48.2 20.8 0.9X
+current_date wholestage off 182 183 1 54.8 18.2 1.0X
+current_date wholestage on 220 228 12 45.5 22.0 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
current_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-current_timestamp wholestage off 190 192 2 52.6 19.0 1.0X
-current_timestamp wholestage on 225 239 18 44.3 22.5 0.8X
+current_timestamp wholestage off 192 195 4 52.0 19.2 1.0X
+current_timestamp wholestage on 217 249 42 46.1 21.7 0.9X
================================================================================================
Date arithmetic
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast to date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to date wholestage off 667 668 3 15.0 66.7 1.0X
-cast to date wholestage on 678 683 6 14.7 67.8 1.0X
+cast to date wholestage off 666 668 2 15.0 66.6 1.0X
+cast to date wholestage on 678 684 5 14.7 67.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
last_day: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-last_day wholestage off 786 786 0 12.7 78.6 1.0X
-last_day wholestage on 777 780 3 12.9 77.7 1.0X
+last_day wholestage off 782 783 1 12.8 78.2 1.0X
+last_day wholestage on 787 789 2 12.7 78.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
next_day: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
next_day wholestage off 699 700 1 14.3 69.9 1.0X
-next_day wholestage on 705 707 2 14.2 70.5 1.0X
+next_day wholestage on 704 708 3 14.2 70.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_add: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_add wholestage off 653 655 2 15.3 65.3 1.0X
-date_add wholestage on 647 658 23 15.5 64.7 1.0X
+date_add wholestage off 651 651 1 15.4 65.1 1.0X
+date_add wholestage on 657 669 19 15.2 65.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_sub: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_sub wholestage off 658 659 2 15.2 65.8 1.0X
-date_sub wholestage on 652 660 5 15.3 65.2 1.0X
+date_sub wholestage off 650 651 2 15.4 65.0 1.0X
+date_sub wholestage on 658 663 4 15.2 65.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
add_months: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-add_months wholestage off 932 932 0 10.7 93.2 1.0X
-add_months wholestage on 925 930 6 10.8 92.5 1.0X
+add_months wholestage off 923 925 2 10.8 92.3 1.0X
+add_months wholestage on 934 939 6 10.7 93.4 1.0X
================================================================================================
Formatting dates
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
format date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-format date wholestage off 3595 3654 83 2.8 359.5 1.0X
-format date wholestage on 3531 3545 9 2.8 353.1 1.0X
+format date wholestage off 3458 3482 34 2.9 345.8 1.0X
+format date wholestage on 3353 3362 10 3.0 335.3 1.0X
================================================================================================
Formatting timestamps
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_unixtime: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-from_unixtime wholestage off 3760 3761 2 2.7 376.0 1.0X
-from_unixtime wholestage on 3836 3852 13 2.6 383.6 1.0X
+from_unixtime wholestage off 3487 3514 38 2.9 348.7 1.0X
+from_unixtime wholestage on 3425 3441 18 2.9 342.5 1.0X
================================================================================================
Convert timestamps
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_utc_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-from_utc_timestamp wholestage off 743 745 2 13.5 74.3 1.0X
-from_utc_timestamp wholestage on 869 873 4 11.5 86.9 0.9X
+from_utc_timestamp wholestage off 734 736 3 13.6 73.4 1.0X
+from_utc_timestamp wholestage on 841 851 14 11.9 84.1 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_utc_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_utc_timestamp wholestage off 1081 1082 2 9.3 108.1 1.0X
-to_utc_timestamp wholestage on 1079 1087 5 9.3 107.9 1.0X
+to_utc_timestamp wholestage off 1115 1115 0 9.0 111.5 1.0X
+to_utc_timestamp wholestage on 1147 1155 13 8.7 114.7 1.0X
================================================================================================
Intervals
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast interval wholestage off 217 219 3 46.1 21.7 1.0X
-cast interval wholestage on 195 200 5 51.3 19.5 1.1X
+cast interval wholestage off 220 222 2 45.5 22.0 1.0X
+cast interval wholestage on 219 223 3 45.6 21.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
datediff: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-datediff wholestage off 1119 1123 6 8.9 111.9 1.0X
-datediff wholestage on 1162 1166 3 8.6 116.2 1.0X
+datediff wholestage off 1116 1117 1 9.0 111.6 1.0X
+datediff wholestage on 1165 1173 7 8.6 116.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
months_between: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-months_between wholestage off 3399 3409 14 2.9 339.9 1.0X
-months_between wholestage on 3477 3485 8 2.9 347.7 1.0X
+months_between wholestage off 3358 3359 1 3.0 335.8 1.0X
+months_between wholestage on 3361 3371 18 3.0 336.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
window: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-window wholestage off 404 409 8 2.5 403.6 1.0X
-window wholestage on 630 652 20 1.6 629.7 0.6X
+window wholestage off 419 428 13 2.4 419.3 1.0X
+window wholestage on 643 661 16 1.6 642.7 0.7X
================================================================================================
Truncation
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc YEAR: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc YEAR wholestage off 1811 1814 4 5.5 181.1 1.0X
-date_trunc YEAR wholestage on 1797 1802 4 5.6 179.7 1.0X
+date_trunc YEAR wholestage off 1752 1763 15 5.7 175.2 1.0X
+date_trunc YEAR wholestage on 1726 1730 4 5.8 172.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc YYYY: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc YYYY wholestage off 1806 1810 6 5.5 180.6 1.0X
-date_trunc YYYY wholestage on 1798 1809 19 5.6 179.8 1.0X
+date_trunc YYYY wholestage off 1774 1777 3 5.6 177.4 1.0X
+date_trunc YYYY wholestage on 1727 1730 3 5.8 172.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc YY: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc YY wholestage off 1814 1815 1 5.5 181.4 1.0X
-date_trunc YY wholestage on 1800 1804 3 5.6 180.0 1.0X
+date_trunc YY wholestage off 1756 1764 12 5.7 175.6 1.0X
+date_trunc YY wholestage on 1723 1729 4 5.8 172.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MON: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MON wholestage off 1843 1846 4 5.4 184.3 1.0X
-date_trunc MON wholestage on 1799 1805 12 5.6 179.9 1.0X
+date_trunc MON wholestage off 1735 1736 1 5.8 173.5 1.0X
+date_trunc MON wholestage on 1758 1760 2 5.7 175.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MONTH: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MONTH wholestage off 1841 1842 1 5.4 184.1 1.0X
-date_trunc MONTH wholestage on 1795 1800 4 5.6 179.5 1.0X
+date_trunc MONTH wholestage off 1741 1743 3 5.7 174.1 1.0X
+date_trunc MONTH wholestage on 1759 1772 21 5.7 175.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MM: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MM wholestage off 1838 1842 6 5.4 183.8 1.0X
-date_trunc MM wholestage on 1796 1805 7 5.6 179.6 1.0X
+date_trunc MM wholestage off 1729 1731 3 5.8 172.9 1.0X
+date_trunc MM wholestage on 1758 1762 4 5.7 175.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc DAY: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc DAY wholestage off 1309 1313 6 7.6 130.9 1.0X
-date_trunc DAY wholestage on 1302 1308 6 7.7 130.2 1.0X
+date_trunc DAY wholestage off 1348 1348 0 7.4 134.8 1.0X
+date_trunc DAY wholestage on 1308 1313 5 7.6 130.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc DD: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc DD wholestage off 1315 1316 1 7.6 131.5 1.0X
-date_trunc DD wholestage on 1302 1304 3 7.7 130.2 1.0X
+date_trunc DD wholestage off 1348 1351 4 7.4 134.8 1.0X
+date_trunc DD wholestage on 1307 1308 1 7.7 130.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc HOUR: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc HOUR wholestage off 1287 1289 2 7.8 128.7 1.0X
-date_trunc HOUR wholestage on 1261 1265 5 7.9 126.1 1.0X
+date_trunc HOUR wholestage off 1327 1334 9 7.5 132.7 1.0X
+date_trunc HOUR wholestage on 1280 1281 2 7.8 128.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc MINUTE: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc MINUTE wholestage off 1316 1318 4 7.6 131.6 1.0X
-date_trunc MINUTE wholestage on 1280 1283 2 7.8 128.0 1.0X
+date_trunc MINUTE wholestage off 1348 1349 1 7.4 134.8 1.0X
+date_trunc MINUTE wholestage on 1305 1310 7 7.7 130.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc SECOND: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc SECOND wholestage off 315 315 0 31.8 31.5 1.0X
-date_trunc SECOND wholestage on 271 274 2 36.9 27.1 1.2X
+date_trunc SECOND wholestage off 325 326 1 30.7 32.5 1.0X
+date_trunc SECOND wholestage on 276 278 2 36.2 27.6 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc WEEK: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc WEEK wholestage off 1687 1690 4 5.9 168.7 1.0X
-date_trunc WEEK wholestage on 1694 1700 4 5.9 169.4 1.0X
+date_trunc WEEK wholestage off 1616 1632 23 6.2 161.6 1.0X
+date_trunc WEEK wholestage on 1625 1629 7 6.2 162.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
date_trunc QUARTER: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-date_trunc QUARTER wholestage off 2405 2405 1 4.2 240.5 1.0X
-date_trunc QUARTER wholestage on 2328 2343 25 4.3 232.8 1.0X
+date_trunc QUARTER wholestage off 2073 2073 1 4.8 207.3 1.0X
+date_trunc QUARTER wholestage on 2077 2094 24 4.8 207.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc year: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc year wholestage off 919 920 1 10.9 91.9 1.0X
-trunc year wholestage on 892 897 4 11.2 89.2 1.0X
+trunc year wholestage off 933 937 5 10.7 93.3 1.0X
+trunc year wholestage on 898 903 5 11.1 89.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc yyyy: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc yyyy wholestage off 920 920 0 10.9 92.0 1.0X
-trunc yyyy wholestage on 889 896 7 11.2 88.9 1.0X
+trunc yyyy wholestage off 932 934 3 10.7 93.2 1.0X
+trunc yyyy wholestage on 901 909 10 11.1 90.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc yy: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc yy wholestage off 918 920 3 10.9 91.8 1.0X
-trunc yy wholestage on 894 896 4 11.2 89.4 1.0X
+trunc yy wholestage off 938 942 6 10.7 93.8 1.0X
+trunc yy wholestage on 897 898 1 11.1 89.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc mon: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc mon wholestage off 898 898 0 11.1 89.8 1.0X
-trunc mon wholestage on 862 865 3 11.6 86.2 1.0X
+trunc mon wholestage off 906 913 9 11.0 90.6 1.0X
+trunc mon wholestage on 883 893 15 11.3 88.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc month: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc month wholestage off 891 893 3 11.2 89.1 1.0X
-trunc month wholestage on 861 863 1 11.6 86.1 1.0X
+trunc month wholestage off 907 907 1 11.0 90.7 1.0X
+trunc month wholestage on 883 884 1 11.3 88.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trunc mm: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-trunc mm wholestage off 895 896 2 11.2 89.5 1.0X
-trunc mm wholestage on 861 864 4 11.6 86.1 1.0X
+trunc mm wholestage off 904 908 6 11.1 90.4 1.0X
+trunc mm wholestage on 881 893 21 11.4 88.1 1.0X
================================================================================================
Parsing
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to timestamp str: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to timestamp str wholestage off 115 116 1 8.7 115.2 1.0X
-to timestamp str wholestage on 99 104 6 10.1 99.4 1.2X
+to timestamp str wholestage off 106 107 2 9.4 106.1 1.0X
+to timestamp str wholestage on 99 100 1 10.1 98.8 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_timestamp wholestage off 744 745 2 1.3 743.6 1.0X
-to_timestamp wholestage on 745 748 3 1.3 744.7 1.0X
+to_timestamp wholestage off 737 737 0 1.4 736.8 1.0X
+to_timestamp wholestage on 747 748 1 1.3 746.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_unix_timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_unix_timestamp wholestage off 748 748 0 1.3 748.2 1.0X
-to_unix_timestamp wholestage on 761 766 9 1.3 760.8 1.0X
+to_unix_timestamp wholestage off 750 762 16 1.3 750.3 1.0X
+to_unix_timestamp wholestage on 758 760 2 1.3 758.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to date str: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to date str wholestage off 135 137 2 7.4 135.4 1.0X
-to date str wholestage on 136 140 5 7.4 135.9 1.0X
+to date str wholestage off 134 136 4 7.5 133.7 1.0X
+to date str wholestage on 130 131 1 7.7 129.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
to_date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-to_date wholestage off 654 655 2 1.5 653.6 1.0X
-to_date wholestage on 649 652 3 1.5 649.5 1.0X
+to_date wholestage off 647 649 2 1.5 647.3 1.0X
+to_date wholestage on 632 634 1 1.6 632.3 1.0X
================================================================================================
Conversion from/to external types
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
To/from Java's date-time: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-From java.sql.Date 279 285 7 17.9 55.8 1.0X
-From java.time.LocalDate 242 242 1 20.7 48.3 1.2X
-Collect java.sql.Date 1131 1375 220 4.4 226.1 0.2X
-Collect java.time.LocalDate 984 1083 115 5.1 196.8 0.3X
-From java.sql.Timestamp 225 236 13 22.2 45.0 1.2X
-From java.time.Instant 179 182 5 28.0 35.7 1.6X
-Collect longs 809 914 181 6.2 161.8 0.3X
-Collect java.sql.Timestamp 865 1112 222 5.8 173.1 0.3X
-Collect java.time.Instant 834 976 152 6.0 166.7 0.3X
-java.sql.Date to Hive string 3819 3954 176 1.3 763.9 0.1X
-java.time.LocalDate to Hive string 3414 3543 114 1.5 682.8 0.1X
-java.sql.Timestamp to Hive string 6507 6599 134 0.8 1301.4 0.0X
-java.time.Instant to Hive string 5115 5206 124 1.0 1022.9 0.1X
+From java.sql.Date 281 283 2 17.8 56.3 1.0X
+From java.time.LocalDate 242 244 2 20.6 48.5 1.2X
+Collect java.sql.Date 1221 1342 111 4.1 244.1 0.2X
+Collect java.time.LocalDate 964 1080 105 5.2 192.9 0.3X
+From java.sql.Timestamp 227 231 7 22.1 45.3 1.2X
+From java.time.Instant 183 187 5 27.3 36.6 1.5X
+Collect longs 891 983 84 5.6 178.3 0.3X
+Collect java.sql.Timestamp 944 1202 225 5.3 188.8 0.3X
+Collect java.time.Instant 966 1046 126 5.2 193.2 0.3X
+java.sql.Date to Hive string 3882 4034 137 1.3 776.3 0.1X
+java.time.LocalDate to Hive string 3308 3348 67 1.5 661.7 0.1X
+java.sql.Timestamp to Hive string 6361 6505 149 0.8 1272.2 0.0X
+java.time.Instant to Hive string 5138 5301 170 1.0 1027.6 0.1X
diff --git a/sql/core/benchmarks/DateTimeRebaseBenchmark-jdk21-results.txt b/sql/core/benchmarks/DateTimeRebaseBenchmark-jdk21-results.txt
index dd76ea3d6e1d7..ffb629892fed2 100644
--- a/sql/core/benchmarks/DateTimeRebaseBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/DateTimeRebaseBenchmark-jdk21-results.txt
@@ -2,153 +2,153 @@
Rebasing dates/timestamps in Parquet datasource
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save DATE to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, noop 10311 10311 0 9.7 103.1 1.0X
-before 1582, noop 6160 6160 0 16.2 61.6 1.7X
-after 1582, rebase EXCEPTION 18563 18563 0 5.4 185.6 0.6X
-after 1582, rebase LEGACY 18638 18638 0 5.4 186.4 0.6X
-after 1582, rebase CORRECTED 18928 18928 0 5.3 189.3 0.5X
-before 1582, rebase LEGACY 14605 14605 0 6.8 146.1 0.7X
-before 1582, rebase CORRECTED 14392 14392 0 6.9 143.9 0.7X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+after 1582, noop 10212 10212 0 9.8 102.1 1.0X
+before 1582, noop 6105 6105 0 16.4 61.1 1.7X
+after 1582, rebase EXCEPTION 19278 19278 0 5.2 192.8 0.5X
+after 1582, rebase LEGACY 18977 18977 0 5.3 189.8 0.5X
+after 1582, rebase CORRECTED 19081 19081 0 5.2 190.8 0.5X
+before 1582, rebase LEGACY 15225 15225 0 6.6 152.3 0.7X
+before 1582, rebase CORRECTED 15244 15244 0 6.6 152.4 0.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load DATE from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, vec off, rebase EXCEPTION 11852 11893 45 8.4 118.5 1.0X
-after 1582, vec off, rebase LEGACY 12029 12065 31 8.3 120.3 1.0X
-after 1582, vec off, rebase CORRECTED 11961 12060 127 8.4 119.6 1.0X
-after 1582, vec on, rebase EXCEPTION 2393 2404 11 41.8 23.9 5.0X
-after 1582, vec on, rebase LEGACY 2502 2516 15 40.0 25.0 4.7X
-after 1582, vec on, rebase CORRECTED 2467 2513 40 40.5 24.7 4.8X
-before 1582, vec off, rebase LEGACY 12216 12263 45 8.2 122.2 1.0X
-before 1582, vec off, rebase CORRECTED 11957 11986 29 8.4 119.6 1.0X
-before 1582, vec on, rebase LEGACY 2851 2880 25 35.1 28.5 4.2X
-before 1582, vec on, rebase CORRECTED 2446 2460 23 40.9 24.5 4.8X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+after 1582, vec off, rebase EXCEPTION 11007 11051 39 9.1 110.1 1.0X
+after 1582, vec off, rebase LEGACY 11022 11031 8 9.1 110.2 1.0X
+after 1582, vec off, rebase CORRECTED 10983 11022 46 9.1 109.8 1.0X
+after 1582, vec on, rebase EXCEPTION 2383 2388 7 42.0 23.8 4.6X
+after 1582, vec on, rebase LEGACY 2466 2472 11 40.5 24.7 4.5X
+after 1582, vec on, rebase CORRECTED 2438 2444 6 41.0 24.4 4.5X
+before 1582, vec off, rebase LEGACY 11465 11546 130 8.7 114.7 1.0X
+before 1582, vec off, rebase CORRECTED 11249 11284 33 8.9 112.5 1.0X
+before 1582, vec on, rebase LEGACY 2769 2786 16 36.1 27.7 4.0X
+before 1582, vec on, rebase CORRECTED 2441 2451 13 41.0 24.4 4.5X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP_INT96 to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2362 2362 0 42.3 23.6 1.0X
+after 1900, noop 2337 2337 0 42.8 23.4 1.0X
before 1900, noop 2361 2361 0 42.4 23.6 1.0X
-after 1900, rebase EXCEPTION 12537 12537 0 8.0 125.4 0.2X
-after 1900, rebase LEGACY 12241 12241 0 8.2 122.4 0.2X
-after 1900, rebase CORRECTED 12272 12272 0 8.1 122.7 0.2X
-before 1900, rebase LEGACY 15654 15654 0 6.4 156.5 0.2X
-before 1900, rebase CORRECTED 13597 13597 0 7.4 136.0 0.2X
+after 1900, rebase EXCEPTION 12186 12186 0 8.2 121.9 0.2X
+after 1900, rebase LEGACY 12195 12195 0 8.2 121.9 0.2X
+after 1900, rebase CORRECTED 12358 12358 0 8.1 123.6 0.2X
+before 1900, rebase LEGACY 14091 14091 0 7.1 140.9 0.2X
+before 1900, rebase CORRECTED 12391 12391 0 8.1 123.9 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP_INT96 from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off, rebase EXCEPTION 16938 17063 112 5.9 169.4 1.0X
-after 1900, vec off, rebase LEGACY 16645 16650 7 6.0 166.5 1.0X
-after 1900, vec off, rebase CORRECTED 16494 16508 12 6.1 164.9 1.0X
-after 1900, vec on, rebase EXCEPTION 4026 4046 21 24.8 40.3 4.2X
-after 1900, vec on, rebase LEGACY 4046 4055 10 24.7 40.5 4.2X
-after 1900, vec on, rebase CORRECTED 4041 4060 17 24.7 40.4 4.2X
-before 1900, vec off, rebase LEGACY 18686 18818 114 5.4 186.9 0.9X
-before 1900, vec off, rebase CORRECTED 16266 16320 50 6.1 162.7 1.0X
-before 1900, vec on, rebase LEGACY 6178 6194 23 16.2 61.8 2.7X
-before 1900, vec on, rebase CORRECTED 4059 4073 16 24.6 40.6 4.2X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+after 1900, vec off, rebase EXCEPTION 16129 16171 37 6.2 161.3 1.0X
+after 1900, vec off, rebase LEGACY 16787 16840 46 6.0 167.9 1.0X
+after 1900, vec off, rebase CORRECTED 15982 16015 37 6.3 159.8 1.0X
+after 1900, vec on, rebase EXCEPTION 4027 4052 33 24.8 40.3 4.0X
+after 1900, vec on, rebase LEGACY 4079 4086 9 24.5 40.8 4.0X
+after 1900, vec on, rebase CORRECTED 4081 4104 24 24.5 40.8 4.0X
+before 1900, vec off, rebase LEGACY 18237 18291 89 5.5 182.4 0.9X
+before 1900, vec off, rebase CORRECTED 15917 15987 73 6.3 159.2 1.0X
+before 1900, vec on, rebase LEGACY 6133 6141 12 16.3 61.3 2.6X
+before 1900, vec on, rebase CORRECTED 4062 4072 13 24.6 40.6 4.0X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP_MICROS to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2404 2404 0 41.6 24.0 1.0X
-before 1900, noop 2349 2349 0 42.6 23.5 1.0X
-after 1900, rebase EXCEPTION 11876 11876 0 8.4 118.8 0.2X
-after 1900, rebase LEGACY 11243 11243 0 8.9 112.4 0.2X
-after 1900, rebase CORRECTED 11348 11348 0 8.8 113.5 0.2X
-before 1900, rebase LEGACY 13254 13254 0 7.5 132.5 0.2X
-before 1900, rebase CORRECTED 11536 11536 0 8.7 115.4 0.2X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+after 1900, noop 2548 2548 0 39.2 25.5 1.0X
+before 1900, noop 2352 2352 0 42.5 23.5 1.1X
+after 1900, rebase EXCEPTION 11992 11992 0 8.3 119.9 0.2X
+after 1900, rebase LEGACY 11708 11708 0 8.5 117.1 0.2X
+after 1900, rebase CORRECTED 11784 11784 0 8.5 117.8 0.2X
+before 1900, rebase LEGACY 13537 13537 0 7.4 135.4 0.2X
+before 1900, rebase CORRECTED 11748 11748 0 8.5 117.5 0.2X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP_MICROS from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off, rebase EXCEPTION 14674 14716 54 6.8 146.7 1.0X
-after 1900, vec off, rebase LEGACY 14633 14706 74 6.8 146.3 1.0X
-after 1900, vec off, rebase CORRECTED 14704 14765 74 6.8 147.0 1.0X
-after 1900, vec on, rebase EXCEPTION 3772 3791 31 26.5 37.7 3.9X
-after 1900, vec on, rebase LEGACY 3744 3790 45 26.7 37.4 3.9X
-after 1900, vec on, rebase CORRECTED 3707 3766 75 27.0 37.1 4.0X
-before 1900, vec off, rebase LEGACY 16749 16837 86 6.0 167.5 0.9X
-before 1900, vec off, rebase CORRECTED 14649 14709 80 6.8 146.5 1.0X
-before 1900, vec on, rebase LEGACY 5535 5548 12 18.1 55.3 2.7X
-before 1900, vec on, rebase CORRECTED 3721 3747 37 26.9 37.2 3.9X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+after 1900, vec off, rebase EXCEPTION 14859 14953 87 6.7 148.6 1.0X
+after 1900, vec off, rebase LEGACY 14898 14952 56 6.7 149.0 1.0X
+after 1900, vec off, rebase CORRECTED 14825 14868 38 6.7 148.2 1.0X
+after 1900, vec on, rebase EXCEPTION 3771 3783 10 26.5 37.7 3.9X
+after 1900, vec on, rebase LEGACY 3768 3800 35 26.5 37.7 3.9X
+after 1900, vec on, rebase CORRECTED 3747 3759 10 26.7 37.5 4.0X
+before 1900, vec off, rebase LEGACY 17281 17347 71 5.8 172.8 0.9X
+before 1900, vec off, rebase CORRECTED 14931 14986 72 6.7 149.3 1.0X
+before 1900, vec on, rebase LEGACY 5572 5609 38 17.9 55.7 2.7X
+before 1900, vec on, rebase CORRECTED 3710 3757 50 27.0 37.1 4.0X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP_MILLIS to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2380 2380 0 42.0 23.8 1.0X
-before 1900, noop 2375 2375 0 42.1 23.7 1.0X
-after 1900, rebase EXCEPTION 11461 11461 0 8.7 114.6 0.2X
-after 1900, rebase LEGACY 11387 11387 0 8.8 113.9 0.2X
-after 1900, rebase CORRECTED 11302 11302 0 8.8 113.0 0.2X
-before 1900, rebase LEGACY 14100 14100 0 7.1 141.0 0.2X
-before 1900, rebase CORRECTED 11411 11411 0 8.8 114.1 0.2X
-
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+after 1900, noop 2359 2359 0 42.4 23.6 1.0X
+before 1900, noop 2433 2433 0 41.1 24.3 1.0X
+after 1900, rebase EXCEPTION 10998 10998 0 9.1 110.0 0.2X
+after 1900, rebase LEGACY 11011 11011 0 9.1 110.1 0.2X
+after 1900, rebase CORRECTED 11328 11328 0 8.8 113.3 0.2X
+before 1900, rebase LEGACY 12980 12980 0 7.7 129.8 0.2X
+before 1900, rebase CORRECTED 10966 10966 0 9.1 109.7 0.2X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP_MILLIS from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off, rebase EXCEPTION 14312 14337 24 7.0 143.1 1.0X
-after 1900, vec off, rebase LEGACY 14327 14406 73 7.0 143.3 1.0X
-after 1900, vec off, rebase CORRECTED 14244 14289 61 7.0 142.4 1.0X
-after 1900, vec on, rebase EXCEPTION 4862 4916 49 20.6 48.6 2.9X
-after 1900, vec on, rebase LEGACY 4469 4498 36 22.4 44.7 3.2X
-after 1900, vec on, rebase CORRECTED 4858 4869 14 20.6 48.6 2.9X
-before 1900, vec off, rebase LEGACY 16578 16652 66 6.0 165.8 0.9X
-before 1900, vec off, rebase CORRECTED 14240 14331 82 7.0 142.4 1.0X
-before 1900, vec on, rebase LEGACY 6015 6044 48 16.6 60.1 2.4X
-before 1900, vec on, rebase CORRECTED 4873 4898 27 20.5 48.7 2.9X
+after 1900, vec off, rebase EXCEPTION 14432 14453 20 6.9 144.3 1.0X
+after 1900, vec off, rebase LEGACY 14708 14761 57 6.8 147.1 1.0X
+after 1900, vec off, rebase CORRECTED 14689 14744 70 6.8 146.9 1.0X
+after 1900, vec on, rebase EXCEPTION 4891 4915 22 20.4 48.9 3.0X
+after 1900, vec on, rebase LEGACY 4353 4392 40 23.0 43.5 3.3X
+after 1900, vec on, rebase CORRECTED 4906 4934 26 20.4 49.1 2.9X
+before 1900, vec off, rebase LEGACY 17095 17242 217 5.8 170.9 0.8X
+before 1900, vec off, rebase CORRECTED 14633 14651 27 6.8 146.3 1.0X
+before 1900, vec on, rebase LEGACY 6068 6069 1 16.5 60.7 2.4X
+before 1900, vec on, rebase CORRECTED 4910 4934 36 20.4 49.1 2.9X
================================================================================================
Rebasing dates/timestamps in ORC datasource
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save DATE to ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, noop 11787 11787 0 8.5 117.9 1.0X
-before 1582, noop 5513 5513 0 18.1 55.1 2.1X
-after 1582 16137 16137 0 6.2 161.4 0.7X
-before 1582 9680 9680 0 10.3 96.8 1.2X
+after 1582, noop 9915 9915 0 10.1 99.2 1.0X
+before 1582, noop 5846 5846 0 17.1 58.5 1.7X
+after 1582 13925 13925 0 7.2 139.2 0.7X
+before 1582 10596 10596 0 9.4 106.0 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load DATE from ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, vec off 8458 8500 37 11.8 84.6 1.0X
-after 1582, vec on 2411 2437 23 41.5 24.1 3.5X
-before 1582, vec off 8607 8658 73 11.6 86.1 1.0X
-before 1582, vec on 2557 2586 45 39.1 25.6 3.3X
+after 1582, vec off 8802 8811 11 11.4 88.0 1.0X
+after 1582, vec on 2410 2434 21 41.5 24.1 3.7X
+before 1582, vec off 8919 8930 10 11.2 89.2 1.0X
+before 1582, vec on 2553 2566 21 39.2 25.5 3.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP to ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2371 2371 0 42.2 23.7 1.0X
-before 1900, noop 2365 2365 0 42.3 23.6 1.0X
-after 1900 9499 9499 0 10.5 95.0 0.2X
-before 1900 12115 12115 0 8.3 121.1 0.2X
+after 1900, noop 2296 2296 0 43.6 23.0 1.0X
+before 1900, noop 2316 2316 0 43.2 23.2 1.0X
+after 1900 11515 11515 0 8.7 115.1 0.2X
+before 1900 12345 12345 0 8.1 123.5 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP from ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off 9880 9897 19 10.1 98.8 1.0X
-after 1900, vec on 3891 3908 18 25.7 38.9 2.5X
-before 1900, vec off 11614 11656 42 8.6 116.1 0.9X
-before 1900, vec on 5409 5441 29 18.5 54.1 1.8X
+after 1900, vec off 10546 10548 3 9.5 105.5 1.0X
+after 1900, vec on 4153 4159 10 24.1 41.5 2.5X
+before 1900, vec off 12789 12815 38 7.8 127.9 0.8X
+before 1900, vec on 5646 5648 2 17.7 56.5 1.9X
diff --git a/sql/core/benchmarks/DateTimeRebaseBenchmark-results.txt b/sql/core/benchmarks/DateTimeRebaseBenchmark-results.txt
index f96863864365d..8d9e830e163fe 100644
--- a/sql/core/benchmarks/DateTimeRebaseBenchmark-results.txt
+++ b/sql/core/benchmarks/DateTimeRebaseBenchmark-results.txt
@@ -2,153 +2,153 @@
Rebasing dates/timestamps in Parquet datasource
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save DATE to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, noop 12334 12334 0 8.1 123.3 1.0X
-before 1582, noop 6783 6783 0 14.7 67.8 1.8X
-after 1582, rebase EXCEPTION 21193 21193 0 4.7 211.9 0.6X
-after 1582, rebase LEGACY 21767 21767 0 4.6 217.7 0.6X
-after 1582, rebase CORRECTED 21968 21968 0 4.6 219.7 0.6X
-before 1582, rebase LEGACY 17878 17878 0 5.6 178.8 0.7X
-before 1582, rebase CORRECTED 17372 17372 0 5.8 173.7 0.7X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+after 1582, noop 11639 11639 0 8.6 116.4 1.0X
+before 1582, noop 6668 6668 0 15.0 66.7 1.7X
+after 1582, rebase EXCEPTION 20766 20766 0 4.8 207.7 0.6X
+after 1582, rebase LEGACY 20737 20737 0 4.8 207.4 0.6X
+after 1582, rebase CORRECTED 20877 20877 0 4.8 208.8 0.6X
+before 1582, rebase LEGACY 16082 16082 0 6.2 160.8 0.7X
+before 1582, rebase CORRECTED 16149 16149 0 6.2 161.5 0.7X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load DATE from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, vec off, rebase EXCEPTION 11178 11279 174 8.9 111.8 1.0X
-after 1582, vec off, rebase LEGACY 11579 11620 44 8.6 115.8 1.0X
-after 1582, vec off, rebase CORRECTED 11618 11659 37 8.6 116.2 1.0X
-after 1582, vec on, rebase EXCEPTION 2549 2561 17 39.2 25.5 4.4X
-after 1582, vec on, rebase LEGACY 2558 2573 14 39.1 25.6 4.4X
-after 1582, vec on, rebase CORRECTED 2507 2540 30 39.9 25.1 4.5X
-before 1582, vec off, rebase LEGACY 11480 11530 79 8.7 114.8 1.0X
-before 1582, vec off, rebase CORRECTED 11377 11392 15 8.8 113.8 1.0X
-before 1582, vec on, rebase LEGACY 2850 2866 23 35.1 28.5 3.9X
-before 1582, vec on, rebase CORRECTED 2504 2529 21 39.9 25.0 4.5X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+after 1582, vec off, rebase EXCEPTION 11234 11278 45 8.9 112.3 1.0X
+after 1582, vec off, rebase LEGACY 11417 11445 31 8.8 114.2 1.0X
+after 1582, vec off, rebase CORRECTED 11277 11301 22 8.9 112.8 1.0X
+after 1582, vec on, rebase EXCEPTION 2499 2522 21 40.0 25.0 4.5X
+after 1582, vec on, rebase LEGACY 2529 2557 29 39.5 25.3 4.4X
+after 1582, vec on, rebase CORRECTED 2452 2503 49 40.8 24.5 4.6X
+before 1582, vec off, rebase LEGACY 11636 11638 4 8.6 116.4 1.0X
+before 1582, vec off, rebase CORRECTED 11413 11433 33 8.8 114.1 1.0X
+before 1582, vec on, rebase LEGACY 2856 2942 134 35.0 28.6 3.9X
+before 1582, vec on, rebase CORRECTED 2423 2432 8 41.3 24.2 4.6X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP_INT96 to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2239 2239 0 44.7 22.4 1.0X
-before 1900, noop 2258 2258 0 44.3 22.6 1.0X
-after 1900, rebase EXCEPTION 13699 13699 0 7.3 137.0 0.2X
-after 1900, rebase LEGACY 13692 13692 0 7.3 136.9 0.2X
-after 1900, rebase CORRECTED 13661 13661 0 7.3 136.6 0.2X
-before 1900, rebase LEGACY 15321 15321 0 6.5 153.2 0.1X
-before 1900, rebase CORRECTED 13646 13646 0 7.3 136.5 0.2X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+after 1900, noop 2256 2256 0 44.3 22.6 1.0X
+before 1900, noop 2318 2318 0 43.1 23.2 1.0X
+after 1900, rebase EXCEPTION 13444 13444 0 7.4 134.4 0.2X
+after 1900, rebase LEGACY 13419 13419 0 7.5 134.2 0.2X
+after 1900, rebase CORRECTED 13231 13231 0 7.6 132.3 0.2X
+before 1900, rebase LEGACY 15176 15176 0 6.6 151.8 0.1X
+before 1900, rebase CORRECTED 13494 13494 0 7.4 134.9 0.2X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP_INT96 from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off, rebase EXCEPTION 14596 14627 27 6.9 146.0 1.0X
-after 1900, vec off, rebase LEGACY 15157 15202 49 6.6 151.6 1.0X
-after 1900, vec off, rebase CORRECTED 14936 14972 33 6.7 149.4 1.0X
-after 1900, vec on, rebase EXCEPTION 5412 5429 18 18.5 54.1 2.7X
-after 1900, vec on, rebase LEGACY 5372 5427 48 18.6 53.7 2.7X
-after 1900, vec on, rebase CORRECTED 5406 5413 9 18.5 54.1 2.7X
-before 1900, vec off, rebase LEGACY 17556 17637 82 5.7 175.6 0.8X
-before 1900, vec off, rebase CORRECTED 15475 15502 26 6.5 154.7 0.9X
-before 1900, vec on, rebase LEGACY 7054 7080 23 14.2 70.5 2.1X
-before 1900, vec on, rebase CORRECTED 5369 5377 8 18.6 53.7 2.7X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+after 1900, vec off, rebase EXCEPTION 14887 14927 50 6.7 148.9 1.0X
+after 1900, vec off, rebase LEGACY 14789 14811 22 6.8 147.9 1.0X
+after 1900, vec off, rebase CORRECTED 14792 14829 40 6.8 147.9 1.0X
+after 1900, vec on, rebase EXCEPTION 4113 4146 33 24.3 41.1 3.6X
+after 1900, vec on, rebase LEGACY 5453 5483 26 18.3 54.5 2.7X
+after 1900, vec on, rebase CORRECTED 4103 4146 41 24.4 41.0 3.6X
+before 1900, vec off, rebase LEGACY 17155 17183 29 5.8 171.5 0.9X
+before 1900, vec off, rebase CORRECTED 14714 14733 20 6.8 147.1 1.0X
+before 1900, vec on, rebase LEGACY 7105 7129 21 14.1 71.1 2.1X
+before 1900, vec on, rebase CORRECTED 4113 4128 23 24.3 41.1 3.6X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP_MICROS to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2260 2260 0 44.2 22.6 1.0X
-before 1900, noop 2253 2253 0 44.4 22.5 1.0X
-after 1900, rebase EXCEPTION 12513 12513 0 8.0 125.1 0.2X
-after 1900, rebase LEGACY 12690 12690 0 7.9 126.9 0.2X
-after 1900, rebase CORRECTED 13009 13009 0 7.7 130.1 0.2X
-before 1900, rebase LEGACY 14412 14412 0 6.9 144.1 0.2X
-before 1900, rebase CORRECTED 12546 12546 0 8.0 125.5 0.2X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+after 1900, noop 2316 2316 0 43.2 23.2 1.0X
+before 1900, noop 2341 2341 0 42.7 23.4 1.0X
+after 1900, rebase EXCEPTION 12220 12220 0 8.2 122.2 0.2X
+after 1900, rebase LEGACY 12031 12031 0 8.3 120.3 0.2X
+after 1900, rebase CORRECTED 12199 12199 0 8.2 122.0 0.2X
+before 1900, rebase LEGACY 14011 14011 0 7.1 140.1 0.2X
+before 1900, rebase CORRECTED 12239 12239 0 8.2 122.4 0.2X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP_MICROS from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off, rebase EXCEPTION 15222 15269 49 6.6 152.2 1.0X
-after 1900, vec off, rebase LEGACY 15154 15189 34 6.6 151.5 1.0X
-after 1900, vec off, rebase CORRECTED 15391 15426 31 6.5 153.9 1.0X
-after 1900, vec on, rebase EXCEPTION 3770 3790 17 26.5 37.7 4.0X
-after 1900, vec on, rebase LEGACY 3814 3869 71 26.2 38.1 4.0X
-after 1900, vec on, rebase CORRECTED 3784 3798 15 26.4 37.8 4.0X
-before 1900, vec off, rebase LEGACY 17591 17636 55 5.7 175.9 0.9X
-before 1900, vec off, rebase CORRECTED 15408 15436 45 6.5 154.1 1.0X
-before 1900, vec on, rebase LEGACY 5604 5629 29 17.8 56.0 2.7X
-before 1900, vec on, rebase CORRECTED 3784 3790 7 26.4 37.8 4.0X
-
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+after 1900, vec off, rebase EXCEPTION 15111 15142 33 6.6 151.1 1.0X
+after 1900, vec off, rebase LEGACY 15282 15396 169 6.5 152.8 1.0X
+after 1900, vec off, rebase CORRECTED 15273 15320 54 6.5 152.7 1.0X
+after 1900, vec on, rebase EXCEPTION 3843 3850 9 26.0 38.4 3.9X
+after 1900, vec on, rebase LEGACY 3862 3882 28 25.9 38.6 3.9X
+after 1900, vec on, rebase CORRECTED 3836 3864 26 26.1 38.4 3.9X
+before 1900, vec off, rebase LEGACY 17575 17590 13 5.7 175.7 0.9X
+before 1900, vec off, rebase CORRECTED 15328 15341 14 6.5 153.3 1.0X
+before 1900, vec on, rebase LEGACY 5662 5674 12 17.7 56.6 2.7X
+before 1900, vec on, rebase CORRECTED 3807 3821 12 26.3 38.1 4.0X
+
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP_MILLIS to parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2303 2303 0 43.4 23.0 1.0X
+after 1900, noop 2262 2262 0 44.2 22.6 1.0X
before 1900, noop 2283 2283 0 43.8 22.8 1.0X
-after 1900, rebase EXCEPTION 11819 11819 0 8.5 118.2 0.2X
-after 1900, rebase LEGACY 11878 11878 0 8.4 118.8 0.2X
-after 1900, rebase CORRECTED 11760 11760 0 8.5 117.6 0.2X
-before 1900, rebase LEGACY 13634 13634 0 7.3 136.3 0.2X
-before 1900, rebase CORRECTED 11533 11533 0 8.7 115.3 0.2X
+after 1900, rebase EXCEPTION 11581 11581 0 8.6 115.8 0.2X
+after 1900, rebase LEGACY 11524 11524 0 8.7 115.2 0.2X
+after 1900, rebase CORRECTED 11721 11721 0 8.5 117.2 0.2X
+before 1900, rebase LEGACY 13792 13792 0 7.3 137.9 0.2X
+before 1900, rebase CORRECTED 11664 11664 0 8.6 116.6 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP_MILLIS from parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off, rebase EXCEPTION 15683 15716 56 6.4 156.8 1.0X
-after 1900, vec off, rebase LEGACY 15669 15708 57 6.4 156.7 1.0X
-after 1900, vec off, rebase CORRECTED 15790 15834 71 6.3 157.9 1.0X
-after 1900, vec on, rebase EXCEPTION 3936 3947 12 25.4 39.4 4.0X
-after 1900, vec on, rebase LEGACY 4508 4534 31 22.2 45.1 3.5X
-after 1900, vec on, rebase CORRECTED 4006 4009 4 25.0 40.1 3.9X
-before 1900, vec off, rebase LEGACY 17911 17944 47 5.6 179.1 0.9X
-before 1900, vec off, rebase CORRECTED 15705 15751 48 6.4 157.1 1.0X
-before 1900, vec on, rebase LEGACY 6250 6260 18 16.0 62.5 2.5X
-before 1900, vec on, rebase CORRECTED 3929 3976 42 25.5 39.3 4.0X
+after 1900, vec off, rebase EXCEPTION 15276 15313 38 6.5 152.8 1.0X
+after 1900, vec off, rebase LEGACY 15279 15323 44 6.5 152.8 1.0X
+after 1900, vec off, rebase CORRECTED 15412 15448 31 6.5 154.1 1.0X
+after 1900, vec on, rebase EXCEPTION 4031 4046 21 24.8 40.3 3.8X
+after 1900, vec on, rebase LEGACY 4618 4629 17 21.7 46.2 3.3X
+after 1900, vec on, rebase CORRECTED 4044 4058 13 24.7 40.4 3.8X
+before 1900, vec off, rebase LEGACY 17341 17397 57 5.8 173.4 0.9X
+before 1900, vec off, rebase CORRECTED 15353 15399 45 6.5 153.5 1.0X
+before 1900, vec on, rebase LEGACY 6287 6292 9 15.9 62.9 2.4X
+before 1900, vec on, rebase CORRECTED 4043 4074 28 24.7 40.4 3.8X
================================================================================================
Rebasing dates/timestamps in ORC datasource
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save DATE to ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, noop 12491 12491 0 8.0 124.9 1.0X
-before 1582, noop 6804 6804 0 14.7 68.0 1.8X
-after 1582 16422 16422 0 6.1 164.2 0.8X
-before 1582 11024 11024 0 9.1 110.2 1.1X
+after 1582, noop 11666 11666 0 8.6 116.7 1.0X
+before 1582, noop 6686 6686 0 15.0 66.9 1.7X
+after 1582 15631 15631 0 6.4 156.3 0.7X
+before 1582 10773 10773 0 9.3 107.7 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load DATE from ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1582, vec off 8591 8595 6 11.6 85.9 1.0X
-after 1582, vec on 2555 2578 31 39.1 25.5 3.4X
-before 1582, vec off 8445 8491 52 11.8 84.5 1.0X
-before 1582, vec on 2706 2715 11 37.0 27.1 3.2X
+after 1582, vec off 8409 8415 10 11.9 84.1 1.0X
+after 1582, vec on 2552 2574 30 39.2 25.5 3.3X
+before 1582, vec off 8456 8533 83 11.8 84.6 1.0X
+before 1582, vec on 2623 2638 14 38.1 26.2 3.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Save TIMESTAMP to ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, noop 2177 2177 0 45.9 21.8 1.0X
-before 1900, noop 2180 2180 0 45.9 21.8 1.0X
-after 1900 8990 8990 0 11.1 89.9 0.2X
-before 1900 11043 11043 0 9.1 110.4 0.2X
+after 1900, noop 2185 2185 0 45.8 21.9 1.0X
+before 1900, noop 2263 2263 0 44.2 22.6 1.0X
+after 1900 9439 9439 0 10.6 94.4 0.2X
+before 1900 11613 11613 0 8.6 116.1 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Load TIMESTAMP from ORC: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-after 1900, vec off 10558 10576 29 9.5 105.6 1.0X
-after 1900, vec on 4070 4109 41 24.6 40.7 2.6X
-before 1900, vec off 11951 11986 41 8.4 119.5 0.9X
-before 1900, vec on 5539 5547 10 18.1 55.4 1.9X
+after 1900, vec off 9771 9811 53 10.2 97.7 1.0X
+after 1900, vec on 4046 4062 14 24.7 40.5 2.4X
+before 1900, vec off 11436 11477 57 8.7 114.4 0.9X
+before 1900, vec on 5690 5701 10 17.6 56.9 1.7X
diff --git a/sql/core/benchmarks/EncodeBenchmark-jdk21-results.txt b/sql/core/benchmarks/EncodeBenchmark-jdk21-results.txt
index 6fa07836f177c..d0b3598712655 100644
--- a/sql/core/benchmarks/EncodeBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/EncodeBenchmark-jdk21-results.txt
@@ -1,8 +1,8 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UTF-32 48699 48707 12 0.2 4869.9 1.0X
-UTF-16 60472 60483 15 0.2 6047.2 0.8X
-UTF-8 31641 31688 66 0.3 3164.1 1.5X
+UTF-32 58475 58556 115 0.2 5847.5 1.0X
+UTF-16 60460 60596 193 0.2 6046.0 1.0X
+UTF-8 32910 32911 1 0.3 3291.0 1.8X
diff --git a/sql/core/benchmarks/EncodeBenchmark-results.txt b/sql/core/benchmarks/EncodeBenchmark-results.txt
index 5df736af1bc5e..58424b316eec5 100644
--- a/sql/core/benchmarks/EncodeBenchmark-results.txt
+++ b/sql/core/benchmarks/EncodeBenchmark-results.txt
@@ -1,8 +1,8 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
encode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UTF-32 33507 33538 44 0.3 3350.7 1.0X
-UTF-16 52085 52137 74 0.2 5208.5 0.6X
-UTF-8 30150 30156 9 0.3 3015.0 1.1X
+UTF-32 56295 56403 153 0.2 5629.5 1.0X
+UTF-16 50644 50653 13 0.2 5064.4 1.1X
+UTF-8 30599 30619 28 0.3 3059.9 1.8X
diff --git a/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-jdk21-results.txt b/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-jdk21-results.txt
index 2aa91c041f04a..8d16f6cb9c5cb 100644
--- a/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-jdk21-results.txt
@@ -2,44 +2,44 @@
WITHOUT SPILL
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array with 100000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ArrayBuffer 2676 2677 2 38.3 26.1 1.0X
-ExternalAppendOnlyUnsafeRowArray 3586 3598 17 28.6 35.0 0.7X
+ArrayBuffer 2797 2810 17 36.6 27.3 1.0X
+ExternalAppendOnlyUnsafeRowArray 3838 3842 6 26.7 37.5 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array with 1000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ArrayBuffer 5541 5543 2 47.3 21.1 1.0X
-ExternalAppendOnlyUnsafeRowArray 12412 12447 50 21.1 47.3 0.4X
+ArrayBuffer 5501 5508 10 47.7 21.0 1.0X
+ExternalAppendOnlyUnsafeRowArray 12829 12879 70 20.4 48.9 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array with 30000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ArrayBuffer 11108 11111 4 44.2 22.6 1.0X
-ExternalAppendOnlyUnsafeRowArray 18620 18663 61 26.4 37.9 0.6X
+ArrayBuffer 10905 11000 135 45.1 22.2 1.0X
+ExternalAppendOnlyUnsafeRowArray 18327 18373 64 26.8 37.3 0.6X
================================================================================================
WITH SPILL
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Spilling with 1000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UnsafeExternalSorter 8438 8501 88 31.1 32.2 1.0X
-ExternalAppendOnlyUnsafeRowArray 6672 6673 0 39.3 25.5 1.3X
+UnsafeExternalSorter 8819 8837 27 29.7 33.6 1.0X
+ExternalAppendOnlyUnsafeRowArray 7137 7140 4 36.7 27.2 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Spilling with 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UnsafeExternalSorter 5 5 0 32.8 30.5 1.0X
-ExternalAppendOnlyUnsafeRowArray 4 4 0 38.6 25.9 1.2X
+UnsafeExternalSorter 5 5 0 33.6 29.8 1.0X
+ExternalAppendOnlyUnsafeRowArray 4 4 0 38.3 26.1 1.1X
diff --git a/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-results.txt b/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-results.txt
index a8fc3fc7e0395..6cc5f3af4581d 100644
--- a/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-results.txt
+++ b/sql/core/benchmarks/ExternalAppendOnlyUnsafeRowArrayBenchmark-results.txt
@@ -2,44 +2,44 @@
WITHOUT SPILL
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array with 100000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ArrayBuffer 2513 2516 3 40.7 24.5 1.0X
-ExternalAppendOnlyUnsafeRowArray 3627 3635 12 28.2 35.4 0.7X
+ArrayBuffer 2536 2538 2 40.4 24.8 1.0X
+ExternalAppendOnlyUnsafeRowArray 3472 3488 22 29.5 33.9 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array with 1000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ArrayBuffer 5460 5468 11 48.0 20.8 1.0X
-ExternalAppendOnlyUnsafeRowArray 12333 12352 28 21.3 47.0 0.4X
+ArrayBuffer 5217 5224 10 50.2 19.9 1.0X
+ExternalAppendOnlyUnsafeRowArray 13015 13025 15 20.1 49.6 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Array with 30000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-ArrayBuffer 10277 10283 9 47.8 20.9 1.0X
-ExternalAppendOnlyUnsafeRowArray 17958 17977 26 27.4 36.5 0.6X
+ArrayBuffer 9950 9973 33 49.4 20.2 1.0X
+ExternalAppendOnlyUnsafeRowArray 17598 17606 13 27.9 35.8 0.6X
================================================================================================
WITH SPILL
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Spilling with 1000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UnsafeExternalSorter 8492 8495 4 30.9 32.4 1.0X
-ExternalAppendOnlyUnsafeRowArray 6176 6181 7 42.4 23.6 1.4X
+UnsafeExternalSorter 8485 8532 67 30.9 32.4 1.0X
+ExternalAppendOnlyUnsafeRowArray 6400 6405 7 41.0 24.4 1.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Spilling with 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UnsafeExternalSorter 5 5 0 34.2 29.2 1.0X
-ExternalAppendOnlyUnsafeRowArray 4 4 0 42.0 23.8 1.2X
+UnsafeExternalSorter 5 5 0 32.5 30.8 1.0X
+ExternalAppendOnlyUnsafeRowArray 4 4 0 38.7 25.8 1.2X
diff --git a/sql/core/benchmarks/ExtractBenchmark-jdk21-results.txt b/sql/core/benchmarks/ExtractBenchmark-jdk21-results.txt
index 84b5eda46cc46..a22cc3228194d 100644
--- a/sql/core/benchmarks/ExtractBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ExtractBenchmark-jdk21-results.txt
@@ -1,104 +1,104 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke extract for timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to timestamp 260 264 4 38.4 26.0 1.0X
-YEAR of timestamp 669 672 3 14.9 66.9 0.4X
-YEAROFWEEK of timestamp 642 643 1 15.6 64.2 0.4X
-QUARTER of timestamp 643 647 3 15.6 64.3 0.4X
-MONTH of timestamp 567 574 7 17.6 56.7 0.5X
-WEEK of timestamp 864 865 2 11.6 86.4 0.3X
-DAY of timestamp 557 562 8 18.0 55.7 0.5X
-DAYOFWEEK of timestamp 742 756 21 13.5 74.2 0.4X
-DOW of timestamp 743 754 18 13.5 74.3 0.4X
-DOW_ISO of timestamp 681 684 3 14.7 68.1 0.4X
-DAYOFWEEK_ISO of timestamp 681 685 7 14.7 68.1 0.4X
-DOY of timestamp 597 603 8 16.7 59.7 0.4X
-HOUR of timestamp 465 468 4 21.5 46.5 0.6X
-MINUTE of timestamp 467 472 6 21.4 46.7 0.6X
-SECOND of timestamp 529 530 2 18.9 52.9 0.5X
+cast to timestamp 255 265 9 39.2 25.5 1.0X
+YEAR of timestamp 693 695 2 14.4 69.3 0.4X
+YEAROFWEEK of timestamp 650 651 2 15.4 65.0 0.4X
+QUARTER of timestamp 649 654 5 15.4 64.9 0.4X
+MONTH of timestamp 571 574 4 17.5 57.1 0.4X
+WEEK of timestamp 892 899 11 11.2 89.2 0.3X
+DAY of timestamp 570 571 1 17.5 57.0 0.4X
+DAYOFWEEK of timestamp 756 758 2 13.2 75.6 0.3X
+DOW of timestamp 755 759 5 13.3 75.5 0.3X
+DOW_ISO of timestamp 694 699 6 14.4 69.4 0.4X
+DAYOFWEEK_ISO of timestamp 697 699 2 14.3 69.7 0.4X
+DOY of timestamp 610 612 2 16.4 61.0 0.4X
+HOUR of timestamp 474 476 4 21.1 47.4 0.5X
+MINUTE of timestamp 472 477 7 21.2 47.2 0.5X
+SECOND of timestamp 538 541 3 18.6 53.8 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke date_part for timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to timestamp 236 243 8 42.4 23.6 1.0X
-YEAR of timestamp 529 533 6 18.9 52.9 0.4X
-YEAROFWEEK of timestamp 601 609 7 16.6 60.1 0.4X
-QUARTER of timestamp 623 629 8 16.0 62.3 0.4X
-MONTH of timestamp 538 542 3 18.6 53.8 0.4X
-WEEK of timestamp 855 859 4 11.7 85.5 0.3X
-DAY of timestamp 555 557 2 18.0 55.5 0.4X
-DAYOFWEEK of timestamp 737 739 2 13.6 73.7 0.3X
-DOW of timestamp 737 739 2 13.6 73.7 0.3X
-DOW_ISO of timestamp 673 676 3 14.9 67.3 0.4X
-DAYOFWEEK_ISO of timestamp 680 689 11 14.7 68.0 0.3X
-DOY of timestamp 589 591 2 17.0 58.9 0.4X
-HOUR of timestamp 460 468 12 21.7 46.0 0.5X
-MINUTE of timestamp 464 465 2 21.6 46.4 0.5X
-SECOND of timestamp 530 541 9 18.9 53.0 0.4X
+cast to timestamp 235 237 4 42.6 23.5 1.0X
+YEAR of timestamp 542 545 4 18.4 54.2 0.4X
+YEAROFWEEK of timestamp 627 632 8 15.9 62.7 0.4X
+QUARTER of timestamp 639 640 1 15.6 63.9 0.4X
+MONTH of timestamp 561 562 2 17.8 56.1 0.4X
+WEEK of timestamp 885 887 2 11.3 88.5 0.3X
+DAY of timestamp 556 564 12 18.0 55.6 0.4X
+DAYOFWEEK of timestamp 750 754 4 13.3 75.0 0.3X
+DOW of timestamp 750 752 2 13.3 75.0 0.3X
+DOW_ISO of timestamp 686 692 6 14.6 68.6 0.3X
+DAYOFWEEK_ISO of timestamp 688 694 5 14.5 68.8 0.3X
+DOY of timestamp 605 607 2 16.5 60.5 0.4X
+HOUR of timestamp 469 471 1 21.3 46.9 0.5X
+MINUTE of timestamp 471 475 6 21.3 47.1 0.5X
+SECOND of timestamp 534 539 4 18.7 53.4 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke extract for date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to date 512 518 7 19.5 51.2 1.0X
-YEAR of date 531 533 2 18.8 53.1 1.0X
-YEAROFWEEK of date 595 596 1 16.8 59.5 0.9X
-QUARTER of date 615 615 1 16.3 61.5 0.8X
-MONTH of date 538 539 1 18.6 53.8 1.0X
-WEEK of date 858 862 4 11.7 85.8 0.6X
-DAY of date 552 553 2 18.1 55.2 0.9X
-DAYOFWEEK of date 740 741 1 13.5 74.0 0.7X
-DOW of date 738 739 2 13.6 73.8 0.7X
-DOW_ISO of date 697 701 6 14.4 69.7 0.7X
-DAYOFWEEK_ISO of date 673 679 5 14.9 67.3 0.8X
-DOY of date 589 597 11 17.0 58.9 0.9X
-HOUR of date 978 989 15 10.2 97.8 0.5X
-MINUTE of date 976 988 13 10.2 97.6 0.5X
-SECOND of date 1035 1041 10 9.7 103.5 0.5X
+cast to date 529 530 1 18.9 52.9 1.0X
+YEAR of date 532 536 4 18.8 53.2 1.0X
+YEAROFWEEK of date 628 629 1 15.9 62.8 0.8X
+QUARTER of date 634 636 2 15.8 63.4 0.8X
+MONTH of date 561 565 5 17.8 56.1 0.9X
+WEEK of date 886 889 3 11.3 88.6 0.6X
+DAY of date 560 563 5 17.9 56.0 0.9X
+DAYOFWEEK of date 756 759 3 13.2 75.6 0.7X
+DOW of date 750 758 9 13.3 75.0 0.7X
+DOW_ISO of date 689 694 4 14.5 68.9 0.8X
+DAYOFWEEK_ISO of date 686 688 2 14.6 68.6 0.8X
+DOY of date 604 605 1 16.6 60.4 0.9X
+HOUR of date 985 995 12 10.2 98.5 0.5X
+MINUTE of date 987 988 1 10.1 98.7 0.5X
+SECOND of date 1036 1041 6 9.7 103.6 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke date_part for date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to date 511 520 11 19.6 51.1 1.0X
-YEAR of date 531 532 1 18.8 53.1 1.0X
-YEAROFWEEK of date 597 599 3 16.7 59.7 0.9X
-QUARTER of date 616 618 3 16.2 61.6 0.8X
-MONTH of date 534 536 1 18.7 53.4 1.0X
-WEEK of date 853 856 3 11.7 85.3 0.6X
-DAY of date 550 551 2 18.2 55.0 0.9X
-DAYOFWEEK of date 734 759 42 13.6 73.4 0.7X
-DOW of date 734 735 2 13.6 73.4 0.7X
-DOW_ISO of date 673 675 2 14.9 67.3 0.8X
-DAYOFWEEK_ISO of date 672 674 3 14.9 67.2 0.8X
-DOY of date 588 594 8 17.0 58.8 0.9X
-HOUR of date 983 983 1 10.2 98.3 0.5X
-MINUTE of date 981 982 1 10.2 98.1 0.5X
-SECOND of date 1032 1034 2 9.7 103.2 0.5X
+cast to date 525 541 25 19.0 52.5 1.0X
+YEAR of date 533 535 3 18.8 53.3 1.0X
+YEAROFWEEK of date 627 628 1 15.9 62.7 0.8X
+QUARTER of date 631 635 5 15.8 63.1 0.8X
+MONTH of date 556 559 2 18.0 55.6 0.9X
+WEEK of date 885 885 1 11.3 88.5 0.6X
+DAY of date 557 558 1 18.0 55.7 0.9X
+DAYOFWEEK of date 748 749 1 13.4 74.8 0.7X
+DOW of date 748 749 2 13.4 74.8 0.7X
+DOW_ISO of date 687 687 1 14.6 68.7 0.8X
+DAYOFWEEK_ISO of date 685 687 2 14.6 68.5 0.8X
+DOY of date 602 604 2 16.6 60.2 0.9X
+HOUR of date 987 989 2 10.1 98.7 0.5X
+MINUTE of date 985 992 8 10.1 98.5 0.5X
+SECOND of date 1035 1037 3 9.7 103.5 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke extract for interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to interval 717 719 2 13.9 71.7 1.0X
-YEAR of interval 713 715 2 14.0 71.3 1.0X
-MONTH of interval 733 736 3 13.6 73.3 1.0X
-DAY of interval 709 717 12 14.1 70.9 1.0X
-HOUR of interval 721 722 2 13.9 72.1 1.0X
-MINUTE of interval 721 727 8 13.9 72.1 1.0X
-SECOND of interval 769 772 4 13.0 76.9 0.9X
+cast to interval 743 746 3 13.5 74.3 1.0X
+YEAR of interval 718 720 2 13.9 71.8 1.0X
+MONTH of interval 724 726 2 13.8 72.4 1.0X
+DAY of interval 723 726 5 13.8 72.3 1.0X
+HOUR of interval 732 733 1 13.7 73.2 1.0X
+MINUTE of interval 735 736 1 13.6 73.5 1.0X
+SECOND of interval 779 784 5 12.8 77.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke date_part for interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to interval 720 721 1 13.9 72.0 1.0X
-YEAR of interval 711 741 53 14.1 71.1 1.0X
-MONTH of interval 739 742 4 13.5 73.9 1.0X
-DAY of interval 708 710 2 14.1 70.8 1.0X
-HOUR of interval 723 730 11 13.8 72.3 1.0X
-MINUTE of interval 723 726 2 13.8 72.3 1.0X
-SECOND of interval 779 781 2 12.8 77.9 0.9X
+cast to interval 742 744 2 13.5 74.2 1.0X
+YEAR of interval 719 720 1 13.9 71.9 1.0X
+MONTH of interval 725 727 2 13.8 72.5 1.0X
+DAY of interval 722 725 2 13.8 72.2 1.0X
+HOUR of interval 732 736 4 13.7 73.2 1.0X
+MINUTE of interval 733 743 14 13.6 73.3 1.0X
+SECOND of interval 783 791 13 12.8 78.3 0.9X
diff --git a/sql/core/benchmarks/ExtractBenchmark-results.txt b/sql/core/benchmarks/ExtractBenchmark-results.txt
index 5c850be75f60d..96179820ea6f1 100644
--- a/sql/core/benchmarks/ExtractBenchmark-results.txt
+++ b/sql/core/benchmarks/ExtractBenchmark-results.txt
@@ -1,104 +1,104 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke extract for timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to timestamp 246 257 10 40.6 24.6 1.0X
-YEAR of timestamp 703 706 3 14.2 70.3 0.4X
-YEAROFWEEK of timestamp 767 780 12 13.0 76.7 0.3X
-QUARTER of timestamp 730 731 1 13.7 73.0 0.3X
-MONTH of timestamp 703 707 5 14.2 70.3 0.4X
-WEEK of timestamp 990 993 3 10.1 99.0 0.2X
-DAY of timestamp 694 700 6 14.4 69.4 0.4X
-DAYOFWEEK of timestamp 843 845 2 11.9 84.3 0.3X
-DOW of timestamp 841 845 5 11.9 84.1 0.3X
-DOW_ISO of timestamp 795 799 4 12.6 79.5 0.3X
-DAYOFWEEK_ISO of timestamp 800 803 5 12.5 80.0 0.3X
-DOY of timestamp 712 715 3 14.0 71.2 0.3X
-HOUR of timestamp 506 513 10 19.8 50.6 0.5X
-MINUTE of timestamp 504 508 7 19.8 50.4 0.5X
-SECOND of timestamp 603 604 2 16.6 60.3 0.4X
+cast to timestamp 255 276 27 39.3 25.5 1.0X
+YEAR of timestamp 695 701 8 14.4 69.5 0.4X
+YEAROFWEEK of timestamp 759 760 1 13.2 75.9 0.3X
+QUARTER of timestamp 700 717 23 14.3 70.0 0.4X
+MONTH of timestamp 682 685 4 14.7 68.2 0.4X
+WEEK of timestamp 988 989 2 10.1 98.8 0.3X
+DAY of timestamp 680 693 22 14.7 68.0 0.4X
+DAYOFWEEK of timestamp 828 833 5 12.1 82.8 0.3X
+DOW of timestamp 827 830 4 12.1 82.7 0.3X
+DOW_ISO of timestamp 803 806 2 12.4 80.3 0.3X
+DAYOFWEEK_ISO of timestamp 784 785 1 12.8 78.4 0.3X
+DOY of timestamp 702 704 3 14.2 70.2 0.4X
+HOUR of timestamp 538 540 2 18.6 53.8 0.5X
+MINUTE of timestamp 538 540 2 18.6 53.8 0.5X
+SECOND of timestamp 644 649 6 15.5 64.4 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke date_part for timestamp: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to timestamp 200 203 3 50.0 20.0 1.0X
-YEAR of timestamp 663 669 5 15.1 66.3 0.3X
-YEAROFWEEK of timestamp 715 718 3 14.0 71.5 0.3X
-QUARTER of timestamp 686 692 10 14.6 68.6 0.3X
-MONTH of timestamp 667 670 3 15.0 66.7 0.3X
-WEEK of timestamp 951 956 5 10.5 95.1 0.2X
-DAY of timestamp 667 681 15 15.0 66.7 0.3X
-DAYOFWEEK of timestamp 808 813 8 12.4 80.8 0.2X
-DOW of timestamp 809 812 3 12.4 80.9 0.2X
-DOW_ISO of timestamp 765 766 1 13.1 76.5 0.3X
-DAYOFWEEK_ISO of timestamp 762 763 3 13.1 76.2 0.3X
-DOY of timestamp 704 709 6 14.2 70.4 0.3X
-HOUR of timestamp 504 507 3 19.8 50.4 0.4X
-MINUTE of timestamp 509 511 2 19.6 50.9 0.4X
-SECOND of timestamp 598 600 3 16.7 59.8 0.3X
+cast to timestamp 233 234 1 43.0 23.3 1.0X
+YEAR of timestamp 666 670 4 15.0 66.6 0.3X
+YEAROFWEEK of timestamp 735 739 4 13.6 73.5 0.3X
+QUARTER of timestamp 688 695 11 14.5 68.8 0.3X
+MONTH of timestamp 670 676 6 14.9 67.0 0.3X
+WEEK of timestamp 980 981 1 10.2 98.0 0.2X
+DAY of timestamp 670 674 5 14.9 67.0 0.3X
+DAYOFWEEK of timestamp 825 835 11 12.1 82.5 0.3X
+DOW of timestamp 821 827 10 12.2 82.1 0.3X
+DOW_ISO of timestamp 781 782 1 12.8 78.1 0.3X
+DAYOFWEEK_ISO of timestamp 780 788 9 12.8 78.0 0.3X
+DOY of timestamp 705 711 9 14.2 70.5 0.3X
+HOUR of timestamp 536 541 5 18.7 53.6 0.4X
+MINUTE of timestamp 546 549 4 18.3 54.6 0.4X
+SECOND of timestamp 644 658 23 15.5 64.4 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke extract for date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to date 572 575 3 17.5 57.2 1.0X
-YEAR of date 660 664 4 15.1 66.0 0.9X
-YEAROFWEEK of date 714 718 4 14.0 71.4 0.8X
-QUARTER of date 683 698 21 14.7 68.3 0.8X
-MONTH of date 666 674 9 15.0 66.6 0.9X
-WEEK of date 953 955 3 10.5 95.3 0.6X
-DAY of date 673 676 4 14.9 67.3 0.9X
-DAYOFWEEK of date 810 815 8 12.3 81.0 0.7X
-DOW of date 807 810 3 12.4 80.7 0.7X
-DOW_ISO of date 766 769 3 13.1 76.6 0.7X
-DAYOFWEEK_ISO of date 765 766 1 13.1 76.5 0.7X
-DOY of date 704 705 1 14.2 70.4 0.8X
-HOUR of date 1118 1121 4 8.9 111.8 0.5X
-MINUTE of date 1129 1130 2 8.9 112.9 0.5X
-SECOND of date 1281 1287 9 7.8 128.1 0.4X
+cast to date 585 586 1 17.1 58.5 1.0X
+YEAR of date 670 674 4 14.9 67.0 0.9X
+YEAROFWEEK of date 738 749 11 13.6 73.8 0.8X
+QUARTER of date 701 701 0 14.3 70.1 0.8X
+MONTH of date 667 673 9 15.0 66.7 0.9X
+WEEK of date 974 978 5 10.3 97.4 0.6X
+DAY of date 669 674 7 14.9 66.9 0.9X
+DAYOFWEEK of date 825 837 20 12.1 82.5 0.7X
+DOW of date 821 824 4 12.2 82.1 0.7X
+DOW_ISO of date 776 777 1 12.9 77.6 0.8X
+DAYOFWEEK_ISO of date 775 776 1 12.9 77.5 0.8X
+DOY of date 697 701 6 14.3 69.7 0.8X
+HOUR of date 1129 1130 1 8.9 112.9 0.5X
+MINUTE of date 1131 1141 17 8.8 113.1 0.5X
+SECOND of date 1255 1257 3 8.0 125.5 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke date_part for date: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to date 570 573 3 17.5 57.0 1.0X
-YEAR of date 659 659 1 15.2 65.9 0.9X
-YEAROFWEEK of date 713 716 4 14.0 71.3 0.8X
-QUARTER of date 683 684 1 14.6 68.3 0.8X
-MONTH of date 663 666 3 15.1 66.3 0.9X
-WEEK of date 947 950 2 10.6 94.7 0.6X
-DAY of date 665 668 3 15.0 66.5 0.9X
-DAYOFWEEK of date 807 808 1 12.4 80.7 0.7X
-DOW of date 805 809 3 12.4 80.5 0.7X
-DOW_ISO of date 758 762 4 13.2 75.8 0.8X
-DAYOFWEEK_ISO of date 761 763 3 13.1 76.1 0.7X
-DOY of date 701 705 4 14.3 70.1 0.8X
-HOUR of date 1119 1129 16 8.9 111.9 0.5X
-MINUTE of date 1121 1128 6 8.9 112.1 0.5X
-SECOND of date 1274 1284 9 7.8 127.4 0.4X
+cast to date 582 583 2 17.2 58.2 1.0X
+YEAR of date 663 663 1 15.1 66.3 0.9X
+YEAROFWEEK of date 731 735 3 13.7 73.1 0.8X
+QUARTER of date 682 688 9 14.7 68.2 0.9X
+MONTH of date 667 669 2 15.0 66.7 0.9X
+WEEK of date 975 980 6 10.3 97.5 0.6X
+DAY of date 665 672 6 15.0 66.5 0.9X
+DAYOFWEEK of date 822 824 3 12.2 82.2 0.7X
+DOW of date 818 822 5 12.2 81.8 0.7X
+DOW_ISO of date 776 787 18 12.9 77.6 0.7X
+DAYOFWEEK_ISO of date 771 784 19 13.0 77.1 0.8X
+DOY of date 697 701 6 14.4 69.7 0.8X
+HOUR of date 1133 1137 6 8.8 113.3 0.5X
+MINUTE of date 1137 1138 1 8.8 113.7 0.5X
+SECOND of date 1245 1247 1 8.0 124.5 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke extract for interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to interval 786 791 5 12.7 78.6 1.0X
-YEAR of interval 786 791 4 12.7 78.6 1.0X
-MONTH of interval 796 799 3 12.6 79.6 1.0X
-DAY of interval 788 790 2 12.7 78.8 1.0X
-HOUR of interval 791 794 3 12.6 79.1 1.0X
-MINUTE of interval 797 799 3 12.5 79.7 1.0X
-SECOND of interval 885 886 2 11.3 88.5 0.9X
+cast to interval 811 824 13 12.3 81.1 1.0X
+YEAR of interval 796 799 3 12.6 79.6 1.0X
+MONTH of interval 801 803 4 12.5 80.1 1.0X
+DAY of interval 801 807 8 12.5 80.1 1.0X
+HOUR of interval 803 806 4 12.5 80.3 1.0X
+MINUTE of interval 808 809 2 12.4 80.8 1.0X
+SECOND of interval 911 919 9 11.0 91.1 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Invoke date_part for interval: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-cast to interval 791 794 2 12.6 79.1 1.0X
-YEAR of interval 789 805 15 12.7 78.9 1.0X
-MONTH of interval 781 787 5 12.8 78.1 1.0X
-DAY of interval 791 794 2 12.6 79.1 1.0X
-HOUR of interval 798 804 11 12.5 79.8 1.0X
-MINUTE of interval 795 798 3 12.6 79.5 1.0X
-SECOND of interval 881 883 2 11.3 88.1 0.9X
+cast to interval 816 819 3 12.3 81.6 1.0X
+YEAR of interval 805 808 2 12.4 80.5 1.0X
+MONTH of interval 801 802 1 12.5 80.1 1.0X
+DAY of interval 797 814 16 12.5 79.7 1.0X
+HOUR of interval 806 807 1 12.4 80.6 1.0X
+MINUTE of interval 804 815 15 12.4 80.4 1.0X
+SECOND of interval 912 924 12 11.0 91.2 0.9X
diff --git a/sql/core/benchmarks/FilterPushdownBenchmark-jdk21-results.txt b/sql/core/benchmarks/FilterPushdownBenchmark-jdk21-results.txt
index 8128fae5e350f..c00d771725f8a 100644
--- a/sql/core/benchmarks/FilterPushdownBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/FilterPushdownBenchmark-jdk21-results.txt
@@ -2,733 +2,733 @@
Pushdown for many distinct value case
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 string row (value IS NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6419 6495 69 2.5 408.1 1.0X
-Parquet Vectorized (Pushdown) 365 389 16 43.1 23.2 17.6X
-Native ORC Vectorized 5170 5230 67 3.0 328.7 1.2X
-Native ORC Vectorized (Pushdown) 309 324 13 50.9 19.6 20.8X
+Parquet Vectorized 6457 6511 42 2.4 410.5 1.0X
+Parquet Vectorized (Pushdown) 331 362 18 47.5 21.0 19.5X
+Native ORC Vectorized 5199 5291 68 3.0 330.5 1.2X
+Native ORC Vectorized (Pushdown) 318 330 8 49.5 20.2 20.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 string row ('7864320' < value < '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6431 6441 7 2.4 408.9 1.0X
-Parquet Vectorized (Pushdown) 324 334 9 48.5 20.6 19.8X
-Native ORC Vectorized 5259 5289 32 3.0 334.4 1.2X
-Native ORC Vectorized (Pushdown) 315 325 10 50.0 20.0 20.4X
+Parquet Vectorized 6315 6337 18 2.5 401.5 1.0X
+Parquet Vectorized (Pushdown) 327 335 6 48.1 20.8 19.3X
+Native ORC Vectorized 5307 5322 17 3.0 337.4 1.2X
+Native ORC Vectorized (Pushdown) 325 347 28 48.3 20.7 19.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 string row (value = '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6492 6515 17 2.4 412.8 1.0X
-Parquet Vectorized (Pushdown) 309 326 14 50.9 19.7 21.0X
-Native ORC Vectorized 5394 5411 26 2.9 342.9 1.2X
-Native ORC Vectorized (Pushdown) 299 316 12 52.7 19.0 21.7X
+Parquet Vectorized 6387 6422 28 2.5 406.1 1.0X
+Parquet Vectorized (Pushdown) 324 330 5 48.6 20.6 19.7X
+Native ORC Vectorized 5314 5324 7 3.0 337.9 1.2X
+Native ORC Vectorized (Pushdown) 320 327 6 49.2 20.3 20.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 string row (value <=> '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6495 6531 31 2.4 412.9 1.0X
-Parquet Vectorized (Pushdown) 304 313 10 51.8 19.3 21.4X
-Native ORC Vectorized 5285 5300 14 3.0 336.0 1.2X
-Native ORC Vectorized (Pushdown) 292 305 9 53.8 18.6 22.2X
+Parquet Vectorized 6328 6336 7 2.5 402.3 1.0X
+Parquet Vectorized (Pushdown) 317 320 2 49.6 20.1 20.0X
+Native ORC Vectorized 5292 5307 14 3.0 336.4 1.2X
+Native ORC Vectorized (Pushdown) 315 318 3 50.0 20.0 20.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 string row ('7864320' <= value <= '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6421 6460 39 2.4 408.2 1.0X
-Parquet Vectorized (Pushdown) 303 316 9 51.8 19.3 21.2X
-Native ORC Vectorized 5286 5308 16 3.0 336.0 1.2X
-Native ORC Vectorized (Pushdown) 298 304 6 52.8 19.0 21.5X
+Parquet Vectorized 6317 6332 15 2.5 401.6 1.0X
+Parquet Vectorized (Pushdown) 317 323 6 49.6 20.1 19.9X
+Native ORC Vectorized 5298 5316 12 3.0 336.8 1.2X
+Native ORC Vectorized (Pushdown) 317 328 11 49.6 20.2 19.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all string rows (value IS NOT NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 14207 14265 44 1.1 903.3 1.0X
-Parquet Vectorized (Pushdown) 14166 14227 38 1.1 900.7 1.0X
-Native ORC Vectorized 12799 12822 29 1.2 813.7 1.1X
-Native ORC Vectorized (Pushdown) 12860 12881 15 1.2 817.6 1.1X
+Parquet Vectorized 13607 13761 92 1.2 865.1 1.0X
+Parquet Vectorized (Pushdown) 13872 13912 58 1.1 881.9 1.0X
+Native ORC Vectorized 12865 12905 33 1.2 817.9 1.1X
+Native ORC Vectorized (Pushdown) 12967 13013 37 1.2 824.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 int row (value IS NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6233 6274 34 2.5 396.3 1.0X
-Parquet Vectorized (Pushdown) 296 324 23 53.2 18.8 21.1X
-Native ORC Vectorized 4775 4801 25 3.3 303.6 1.3X
-Native ORC Vectorized (Pushdown) 294 303 8 53.5 18.7 21.2X
+Parquet Vectorized 6151 6175 19 2.6 391.1 1.0X
+Parquet Vectorized (Pushdown) 292 313 19 53.8 18.6 21.1X
+Native ORC Vectorized 4759 4811 39 3.3 302.6 1.3X
+Native ORC Vectorized (Pushdown) 287 310 12 54.8 18.2 21.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 int row (7864320 < value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6109 6131 22 2.6 388.4 1.0X
-Parquet Vectorized (Pushdown) 316 324 6 49.8 20.1 19.3X
-Native ORC Vectorized 4766 4781 13 3.3 303.0 1.3X
-Native ORC Vectorized (Pushdown) 297 305 7 53.0 18.9 20.6X
+Parquet Vectorized 6072 6079 5 2.6 386.1 1.0X
+Parquet Vectorized (Pushdown) 297 304 5 52.9 18.9 20.4X
+Native ORC Vectorized 4752 4766 9 3.3 302.1 1.3X
+Native ORC Vectorized (Pushdown) 287 298 10 54.7 18.3 21.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6211 6238 26 2.5 394.9 1.0X
-Parquet Vectorized (Pushdown) 304 315 9 51.8 19.3 20.5X
-Native ORC Vectorized 4824 4849 22 3.3 306.7 1.3X
-Native ORC Vectorized (Pushdown) 278 286 7 56.6 17.7 22.4X
+Parquet Vectorized 6134 6144 7 2.6 390.0 1.0X
+Parquet Vectorized (Pushdown) 291 299 5 54.1 18.5 21.1X
+Native ORC Vectorized 4773 4832 34 3.3 303.5 1.3X
+Native ORC Vectorized (Pushdown) 288 294 4 54.6 18.3 21.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (value <=> 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6153 6156 4 2.6 391.2 1.0X
-Parquet Vectorized (Pushdown) 295 301 4 53.4 18.7 20.9X
-Native ORC Vectorized 4864 4881 10 3.2 309.3 1.3X
-Native ORC Vectorized (Pushdown) 277 289 9 56.8 17.6 22.2X
+Parquet Vectorized 6130 6144 20 2.6 389.7 1.0X
+Parquet Vectorized (Pushdown) 288 293 4 54.7 18.3 21.3X
+Native ORC Vectorized 4769 4810 23 3.3 303.2 1.3X
+Native ORC Vectorized (Pushdown) 286 292 5 55.0 18.2 21.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (7864320 <= value <= 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6164 6181 14 2.6 391.9 1.0X
-Parquet Vectorized (Pushdown) 299 302 4 52.7 19.0 20.6X
-Native ORC Vectorized 4846 4871 24 3.2 308.1 1.3X
-Native ORC Vectorized (Pushdown) 277 289 8 56.7 17.6 22.2X
+Parquet Vectorized 6118 6142 22 2.6 388.9 1.0X
+Parquet Vectorized (Pushdown) 290 294 3 54.2 18.4 21.1X
+Native ORC Vectorized 4826 4830 2 3.3 306.9 1.3X
+Native ORC Vectorized (Pushdown) 288 294 4 54.7 18.3 21.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (7864319 < value < 7864321): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6138 6163 16 2.6 390.2 1.0X
-Parquet Vectorized (Pushdown) 291 300 5 54.0 18.5 21.1X
-Native ORC Vectorized 4833 4849 14 3.3 307.3 1.3X
-Native ORC Vectorized (Pushdown) 274 282 6 57.5 17.4 22.4X
+Parquet Vectorized 6113 6125 17 2.6 388.6 1.0X
+Parquet Vectorized (Pushdown) 288 293 4 54.7 18.3 21.3X
+Native ORC Vectorized 4806 4820 21 3.3 305.5 1.3X
+Native ORC Vectorized (Pushdown) 283 290 5 55.5 18.0 21.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% int rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6789 6817 29 2.3 431.6 1.0X
-Parquet Vectorized (Pushdown) 1547 1564 17 10.2 98.3 4.4X
-Native ORC Vectorized 5444 5466 17 2.9 346.1 1.2X
-Native ORC Vectorized (Pushdown) 1388 1394 8 11.3 88.2 4.9X
+Parquet Vectorized 6781 6812 29 2.3 431.1 1.0X
+Parquet Vectorized (Pushdown) 1545 1550 6 10.2 98.2 4.4X
+Native ORC Vectorized 5477 5482 4 2.9 348.2 1.2X
+Native ORC Vectorized (Pushdown) 1426 1434 7 11.0 90.6 4.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% int rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9167 9207 37 1.7 582.8 1.0X
-Parquet Vectorized (Pushdown) 6291 6306 12 2.5 400.0 1.5X
-Native ORC Vectorized 7845 7882 46 2.0 498.8 1.2X
-Native ORC Vectorized (Pushdown) 5718 5729 11 2.8 363.5 1.6X
+Parquet Vectorized 9288 9304 12 1.7 590.5 1.0X
+Parquet Vectorized (Pushdown) 6431 6456 17 2.4 408.9 1.4X
+Native ORC Vectorized 8090 8131 60 1.9 514.3 1.1X
+Native ORC Vectorized (Pushdown) 5847 5861 11 2.7 371.8 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% int rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 11661 11680 16 1.3 741.4 1.0X
-Parquet Vectorized (Pushdown) 11121 11142 23 1.4 707.0 1.0X
-Native ORC Vectorized 10366 10402 38 1.5 659.1 1.1X
-Native ORC Vectorized (Pushdown) 9982 10009 28 1.6 634.6 1.2X
+Parquet Vectorized 11939 11962 20 1.3 759.0 1.0X
+Parquet Vectorized (Pushdown) 11431 11452 14 1.4 726.8 1.0X
+Native ORC Vectorized 10627 10646 17 1.5 675.6 1.1X
+Native ORC Vectorized (Pushdown) 10242 10282 53 1.5 651.2 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all int rows (value IS NOT NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 12163 12182 18 1.3 773.3 1.0X
-Parquet Vectorized (Pushdown) 12196 12224 20 1.3 775.4 1.0X
-Native ORC Vectorized 10954 10971 26 1.4 696.5 1.1X
-Native ORC Vectorized (Pushdown) 11012 11035 19 1.4 700.2 1.1X
+Parquet Vectorized 12465 12473 6 1.3 792.5 1.0X
+Parquet Vectorized (Pushdown) 12514 12541 21 1.3 795.6 1.0X
+Native ORC Vectorized 11133 11145 10 1.4 707.8 1.1X
+Native ORC Vectorized (Pushdown) 11245 11275 22 1.4 715.0 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all int rows (value > -1): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 12326 12343 12 1.3 783.7 1.0X
-Parquet Vectorized (Pushdown) 12321 12343 19 1.3 783.3 1.0X
-Native ORC Vectorized 10831 10850 27 1.5 688.6 1.1X
-Native ORC Vectorized (Pushdown) 10937 10953 12 1.4 695.3 1.1X
+Parquet Vectorized 12470 12495 26 1.3 792.8 1.0X
+Parquet Vectorized (Pushdown) 12543 12569 17 1.3 797.5 1.0X
+Native ORC Vectorized 11253 11274 12 1.4 715.5 1.1X
+Native ORC Vectorized (Pushdown) 11339 11371 20 1.4 720.9 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all int rows (value != -1): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 12060 12089 20 1.3 766.7 1.0X
-Parquet Vectorized (Pushdown) 12142 12186 43 1.3 772.0 1.0X
-Native ORC Vectorized 10799 10834 24 1.5 686.6 1.1X
-Native ORC Vectorized (Pushdown) 10903 10952 41 1.4 693.2 1.1X
+Parquet Vectorized 12512 12556 28 1.3 795.5 1.0X
+Parquet Vectorized (Pushdown) 12589 12618 28 1.2 800.4 1.0X
+Native ORC Vectorized 11292 11305 24 1.4 718.0 1.1X
+Native ORC Vectorized (Pushdown) 11355 11384 31 1.4 721.9 1.1X
================================================================================================
Pushdown for few distinct value case (use dictionary encoding)
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 distinct string row (value IS NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5716 5771 45 2.8 363.4 1.0X
-Parquet Vectorized (Pushdown) 245 256 11 64.1 15.6 23.3X
-Native ORC Vectorized 6171 6213 43 2.5 392.3 0.9X
-Native ORC Vectorized (Pushdown) 906 913 6 17.4 57.6 6.3X
+Parquet Vectorized 5514 5533 19 2.9 350.5 1.0X
+Parquet Vectorized (Pushdown) 240 265 22 65.6 15.2 23.0X
+Native ORC Vectorized 6365 6386 19 2.5 404.7 0.9X
+Native ORC Vectorized (Pushdown) 944 955 9 16.7 60.0 5.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 distinct string row ('100' < value < '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5665 5686 22 2.8 360.2 1.0X
-Parquet Vectorized (Pushdown) 246 254 7 63.9 15.7 23.0X
-Native ORC Vectorized 6401 6409 15 2.5 407.0 0.9X
-Native ORC Vectorized (Pushdown) 908 921 15 17.3 57.7 6.2X
+Parquet Vectorized 5579 5590 9 2.8 354.7 1.0X
+Parquet Vectorized (Pushdown) 239 246 10 65.9 15.2 23.4X
+Native ORC Vectorized 6575 6586 9 2.4 418.0 0.8X
+Native ORC Vectorized (Pushdown) 947 954 5 16.6 60.2 5.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 distinct string row (value = '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5621 5633 12 2.8 357.3 1.0X
-Parquet Vectorized (Pushdown) 310 317 7 50.8 19.7 18.1X
-Native ORC Vectorized 6390 6402 10 2.5 406.2 0.9X
-Native ORC Vectorized (Pushdown) 949 955 6 16.6 60.3 5.9X
+Parquet Vectorized 5554 5560 5 2.8 353.1 1.0X
+Parquet Vectorized (Pushdown) 284 290 6 55.3 18.1 19.5X
+Native ORC Vectorized 6614 6626 12 2.4 420.5 0.8X
+Native ORC Vectorized (Pushdown) 996 1013 22 15.8 63.3 5.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 distinct string row (value <=> '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5605 5620 18 2.8 356.4 1.0X
-Parquet Vectorized (Pushdown) 288 292 3 54.6 18.3 19.4X
-Native ORC Vectorized 6377 6406 26 2.5 405.4 0.9X
-Native ORC Vectorized (Pushdown) 947 954 6 16.6 60.2 5.9X
+Parquet Vectorized 5500 5524 21 2.9 349.7 1.0X
+Parquet Vectorized (Pushdown) 282 286 2 55.7 18.0 19.5X
+Native ORC Vectorized 6609 6637 18 2.4 420.2 0.8X
+Native ORC Vectorized (Pushdown) 1000 1008 10 15.7 63.6 5.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 distinct string row ('100' <= value <= '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5673 5705 27 2.8 360.7 1.0X
-Parquet Vectorized (Pushdown) 294 303 10 53.5 18.7 19.3X
-Native ORC Vectorized 6458 6481 27 2.4 410.6 0.9X
-Native ORC Vectorized (Pushdown) 958 962 5 16.4 60.9 5.9X
+Parquet Vectorized 5574 5599 24 2.8 354.4 1.0X
+Parquet Vectorized (Pushdown) 285 293 8 55.1 18.1 19.5X
+Native ORC Vectorized 6654 6668 15 2.4 423.0 0.8X
+Native ORC Vectorized (Pushdown) 999 1005 7 15.7 63.5 5.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all distinct string rows (value IS NOT NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 13823 13841 17 1.1 878.8 1.0X
-Parquet Vectorized (Pushdown) 13836 13862 22 1.1 879.6 1.0X
-Native ORC Vectorized 14784 14837 79 1.1 939.9 0.9X
-Native ORC Vectorized (Pushdown) 14990 15048 52 1.0 953.1 0.9X
+Parquet Vectorized 13703 13741 26 1.1 871.2 1.0X
+Parquet Vectorized (Pushdown) 13739 13772 24 1.1 873.5 1.0X
+Native ORC Vectorized 15511 15562 38 1.0 986.2 0.9X
+Native ORC Vectorized (Pushdown) 15773 15841 122 1.0 1002.8 0.9X
================================================================================================
Pushdown benchmark for StringStartsWith
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringStartsWith filter: (value like '10%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6910 6946 24 2.3 439.3 1.0X
-Parquet Vectorized (Pushdown) 922 938 14 17.1 58.6 7.5X
-Native ORC Vectorized 5528 5546 14 2.8 351.4 1.3X
-Native ORC Vectorized (Pushdown) 5609 5625 10 2.8 356.6 1.2X
+Parquet Vectorized 6657 6673 11 2.4 423.2 1.0X
+Parquet Vectorized (Pushdown) 922 929 4 17.1 58.6 7.2X
+Native ORC Vectorized 5672 5736 58 2.8 360.6 1.2X
+Native ORC Vectorized (Pushdown) 5742 5761 21 2.7 365.1 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringStartsWith filter: (value like '1000%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6554 6567 11 2.4 416.7 1.0X
-Parquet Vectorized (Pushdown) 302 310 7 52.1 19.2 21.7X
-Native ORC Vectorized 5339 5360 17 2.9 339.4 1.2X
-Native ORC Vectorized (Pushdown) 5436 5460 20 2.9 345.6 1.2X
+Parquet Vectorized 6434 6445 16 2.4 409.1 1.0X
+Parquet Vectorized (Pushdown) 278 282 4 56.7 17.7 23.2X
+Native ORC Vectorized 5484 5500 25 2.9 348.7 1.2X
+Native ORC Vectorized (Pushdown) 5556 5579 17 2.8 353.2 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringStartsWith filter: (value like '786432%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6549 6556 6 2.4 416.4 1.0X
-Parquet Vectorized (Pushdown) 296 303 5 53.2 18.8 22.1X
-Native ORC Vectorized 5348 5378 20 2.9 340.0 1.2X
-Native ORC Vectorized (Pushdown) 5441 5449 8 2.9 345.9 1.2X
+Parquet Vectorized 6419 6434 15 2.5 408.1 1.0X
+Parquet Vectorized (Pushdown) 268 276 7 58.7 17.0 23.9X
+Native ORC Vectorized 5454 5480 27 2.9 346.7 1.2X
+Native ORC Vectorized (Pushdown) 5541 5561 16 2.8 352.3 1.2X
================================================================================================
Pushdown benchmark for StringEndsWith
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringEndsWith filter: (value like '%10'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5813 5950 171 2.7 369.6 1.0X
-Parquet Vectorized (Pushdown) 403 455 56 39.0 25.6 14.4X
-Native ORC Vectorized 6523 6559 24 2.4 414.7 0.9X
-Native ORC Vectorized (Pushdown) 6692 6727 30 2.4 425.5 0.9X
+Parquet Vectorized 5559 5580 31 2.8 353.5 1.0X
+Parquet Vectorized (Pushdown) 359 379 21 43.8 22.8 15.5X
+Native ORC Vectorized 6650 6690 58 2.4 422.8 0.8X
+Native ORC Vectorized (Pushdown) 6873 6889 19 2.3 437.0 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringEndsWith filter: (value like '%1000'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5552 5564 9 2.8 353.0 1.0X
-Parquet Vectorized (Pushdown) 284 304 19 55.5 18.0 19.6X
-Native ORC Vectorized 6441 6457 16 2.4 409.5 0.9X
-Native ORC Vectorized (Pushdown) 6687 6714 17 2.4 425.1 0.8X
+Parquet Vectorized 5438 5451 12 2.9 345.7 1.0X
+Parquet Vectorized (Pushdown) 267 271 4 59.0 17.0 20.4X
+Native ORC Vectorized 6587 6605 19 2.4 418.8 0.8X
+Native ORC Vectorized (Pushdown) 6784 6809 21 2.3 431.3 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringEndsWith filter: (value like '%786432'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5525 5541 21 2.8 351.3 1.0X
-Parquet Vectorized (Pushdown) 276 290 7 56.9 17.6 20.0X
-Native ORC Vectorized 6437 6455 17 2.4 409.2 0.9X
-Native ORC Vectorized (Pushdown) 6634 6658 21 2.4 421.8 0.8X
+Parquet Vectorized 5445 5460 10 2.9 346.2 1.0X
+Parquet Vectorized (Pushdown) 269 279 14 58.6 17.1 20.3X
+Native ORC Vectorized 6625 6641 10 2.4 421.2 0.8X
+Native ORC Vectorized (Pushdown) 6854 6869 12 2.3 435.8 0.8X
================================================================================================
Pushdown benchmark for StringContains
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringContains filter: (value like '%10%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5809 5972 92 2.7 369.3 1.0X
-Parquet Vectorized (Pushdown) 832 846 14 18.9 52.9 7.0X
-Native ORC Vectorized 6491 6536 47 2.4 412.7 0.9X
-Native ORC Vectorized (Pushdown) 6711 6733 27 2.3 426.7 0.9X
+Parquet Vectorized 5895 5923 22 2.7 374.8 1.0X
+Parquet Vectorized (Pushdown) 821 837 13 19.2 52.2 7.2X
+Native ORC Vectorized 6951 7011 79 2.3 442.0 0.8X
+Native ORC Vectorized (Pushdown) 7168 7197 25 2.2 455.7 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringContains filter: (value like '%1000%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5538 5551 15 2.8 352.1 1.0X
-Parquet Vectorized (Pushdown) 280 291 8 56.1 17.8 19.8X
-Native ORC Vectorized 6255 6270 12 2.5 397.7 0.9X
-Native ORC Vectorized (Pushdown) 6481 6505 23 2.4 412.1 0.9X
+Parquet Vectorized 5503 5520 16 2.9 349.8 1.0X
+Parquet Vectorized (Pushdown) 267 273 3 58.8 17.0 20.6X
+Native ORC Vectorized 6657 6667 13 2.4 423.2 0.8X
+Native ORC Vectorized (Pushdown) 6874 6888 12 2.3 437.0 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringContains filter: (value like '%786432%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5541 5547 6 2.8 352.3 1.0X
-Parquet Vectorized (Pushdown) 282 287 4 55.7 17.9 19.6X
-Native ORC Vectorized 6246 6271 21 2.5 397.1 0.9X
-Native ORC Vectorized (Pushdown) 6461 6475 10 2.4 410.8 0.9X
+Parquet Vectorized 5503 5517 13 2.9 349.9 1.0X
+Parquet Vectorized (Pushdown) 270 275 3 58.2 17.2 20.4X
+Native ORC Vectorized 6659 6681 22 2.4 423.3 0.8X
+Native ORC Vectorized (Pushdown) 6865 6898 22 2.3 436.5 0.8X
================================================================================================
Pushdown benchmark for decimal
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 decimal(9, 2) row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 2439 2480 64 6.5 155.0 1.0X
-Parquet Vectorized (Pushdown) 72 88 17 219.8 4.5 34.1X
-Native ORC Vectorized 3246 3265 25 4.8 206.4 0.8X
-Native ORC Vectorized (Pushdown) 58 63 6 272.9 3.7 42.3X
+Parquet Vectorized 2335 2352 24 6.7 148.4 1.0X
+Parquet Vectorized (Pushdown) 70 81 5 223.8 4.5 33.2X
+Native ORC Vectorized 3294 3304 18 4.8 209.4 0.7X
+Native ORC Vectorized (Pushdown) 61 70 5 257.9 3.9 38.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% decimal(9, 2) rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3793 3802 8 4.1 241.2 1.0X
-Parquet Vectorized (Pushdown) 1887 1907 20 8.3 120.0 2.0X
-Native ORC Vectorized 4669 4712 44 3.4 296.8 0.8X
-Native ORC Vectorized (Pushdown) 2076 2103 21 7.6 132.0 1.8X
+Parquet Vectorized 3704 3728 29 4.2 235.5 1.0X
+Parquet Vectorized (Pushdown) 1851 1863 7 8.5 117.7 2.0X
+Native ORC Vectorized 4887 4906 11 3.2 310.7 0.8X
+Native ORC Vectorized (Pushdown) 2234 2240 4 7.0 142.1 1.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% decimal(9, 2) rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 8246 8261 17 1.9 524.3 1.0X
-Parquet Vectorized (Pushdown) 7933 7958 17 2.0 504.4 1.0X
-Native ORC Vectorized 9316 9341 19 1.7 592.3 0.9X
-Native ORC Vectorized (Pushdown) 8905 8938 27 1.8 566.1 0.9X
+Parquet Vectorized 8080 8103 29 1.9 513.7 1.0X
+Parquet Vectorized (Pushdown) 7803 7823 12 2.0 496.1 1.0X
+Native ORC Vectorized 10009 10022 11 1.6 636.4 0.8X
+Native ORC Vectorized (Pushdown) 9572 9599 39 1.6 608.5 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% decimal(9, 2) rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9503 9576 69 1.7 604.2 1.0X
-Parquet Vectorized (Pushdown) 9497 9514 14 1.7 603.8 1.0X
-Native ORC Vectorized 10621 10667 50 1.5 675.2 0.9X
-Native ORC Vectorized (Pushdown) 10603 10654 36 1.5 674.1 0.9X
+Parquet Vectorized 9337 9366 32 1.7 593.6 1.0X
+Parquet Vectorized (Pushdown) 9353 9366 10 1.7 594.6 1.0X
+Native ORC Vectorized 11264 11287 18 1.4 716.1 0.8X
+Native ORC Vectorized (Pushdown) 11287 11309 16 1.4 717.6 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 decimal(18, 2) row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 2641 2666 30 6.0 167.9 1.0X
-Parquet Vectorized (Pushdown) 72 78 10 217.5 4.6 36.5X
-Native ORC Vectorized 3288 3324 37 4.8 209.0 0.8X
-Native ORC Vectorized (Pushdown) 55 65 7 286.3 3.5 48.1X
+Parquet Vectorized 2529 2539 7 6.2 160.8 1.0X
+Parquet Vectorized (Pushdown) 71 82 7 221.4 4.5 35.6X
+Native ORC Vectorized 3300 3321 26 4.8 209.8 0.8X
+Native ORC Vectorized (Pushdown) 59 66 5 267.7 3.7 43.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% decimal(18, 2) rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3314 3376 74 4.7 210.7 1.0X
-Parquet Vectorized (Pushdown) 1045 1054 8 15.1 66.4 3.2X
-Native ORC Vectorized 4024 4048 36 3.9 255.9 0.8X
-Native ORC Vectorized (Pushdown) 1090 1102 12 14.4 69.3 3.0X
+Parquet Vectorized 3232 3257 36 4.9 205.5 1.0X
+Parquet Vectorized (Pushdown) 1028 1031 3 15.3 65.4 3.1X
+Native ORC Vectorized 4080 4090 11 3.9 259.4 0.8X
+Native ORC Vectorized (Pushdown) 1166 1172 7 13.5 74.1 2.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% decimal(18, 2) rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6161 6172 10 2.6 391.7 1.0X
-Parquet Vectorized (Pushdown) 4923 4957 51 3.2 313.0 1.3X
-Native ORC Vectorized 6961 6979 19 2.3 442.6 0.9X
-Native ORC Vectorized (Pushdown) 5280 5301 18 3.0 335.7 1.2X
+Parquet Vectorized 6104 6112 8 2.6 388.1 1.0X
+Parquet Vectorized (Pushdown) 4888 4905 18 3.2 310.8 1.2X
+Native ORC Vectorized 7257 7276 11 2.2 461.4 0.8X
+Native ORC Vectorized (Pushdown) 5610 5620 7 2.8 356.7 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% decimal(18, 2) rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9004 9028 28 1.7 572.5 1.0X
-Parquet Vectorized (Pushdown) 8775 8790 11 1.8 557.9 1.0X
-Native ORC Vectorized 9794 9807 15 1.6 622.7 0.9X
-Native ORC Vectorized (Pushdown) 9490 9506 12 1.7 603.4 0.9X
+Parquet Vectorized 8832 8872 41 1.8 561.5 1.0X
+Parquet Vectorized (Pushdown) 8620 8628 7 1.8 548.0 1.0X
+Native ORC Vectorized 10412 10427 20 1.5 662.0 0.8X
+Native ORC Vectorized (Pushdown) 10104 10139 37 1.6 642.4 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 decimal(38, 2) row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3780 3801 16 4.2 240.3 1.0X
-Parquet Vectorized (Pushdown) 79 98 22 200.0 5.0 48.1X
-Native ORC Vectorized 3288 3300 9 4.8 209.1 1.1X
-Native ORC Vectorized (Pushdown) 54 59 5 288.6 3.5 69.4X
+Parquet Vectorized 3829 3847 13 4.1 243.4 1.0X
+Parquet Vectorized (Pushdown) 75 84 5 210.2 4.8 51.2X
+Native ORC Vectorized 3304 3316 24 4.8 210.0 1.2X
+Native ORC Vectorized (Pushdown) 57 65 4 276.5 3.6 67.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% decimal(38, 2) rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 4732 4780 66 3.3 300.8 1.0X
-Parquet Vectorized (Pushdown) 1392 1404 8 11.3 88.5 3.4X
-Native ORC Vectorized 4156 4165 10 3.8 264.2 1.1X
-Native ORC Vectorized (Pushdown) 1234 1241 5 12.7 78.5 3.8X
+Parquet Vectorized 4667 4699 40 3.4 296.7 1.0X
+Parquet Vectorized (Pushdown) 1339 1344 4 11.7 85.1 3.5X
+Native ORC Vectorized 4215 4227 11 3.7 268.0 1.1X
+Native ORC Vectorized (Pushdown) 1286 1289 3 12.2 81.8 3.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% decimal(38, 2) rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 8479 8513 43 1.9 539.1 1.0X
-Parquet Vectorized (Pushdown) 6654 6669 23 2.4 423.0 1.3X
-Native ORC Vectorized 7628 7634 5 2.1 485.0 1.1X
-Native ORC Vectorized (Pushdown) 5957 5981 37 2.6 378.8 1.4X
+Parquet Vectorized 8329 8343 16 1.9 529.6 1.0X
+Parquet Vectorized (Pushdown) 6485 6499 11 2.4 412.3 1.3X
+Native ORC Vectorized 7903 7918 15 2.0 502.5 1.1X
+Native ORC Vectorized (Pushdown) 6234 6256 12 2.5 396.4 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% decimal(38, 2) rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 12128 12143 13 1.3 771.1 1.0X
-Parquet Vectorized (Pushdown) 11813 11820 11 1.3 751.0 1.0X
-Native ORC Vectorized 11005 11012 6 1.4 699.7 1.1X
-Native ORC Vectorized (Pushdown) 10691 10711 15 1.5 679.7 1.1X
+Parquet Vectorized 11910 11926 16 1.3 757.2 1.0X
+Parquet Vectorized (Pushdown) 11574 11583 9 1.4 735.9 1.0X
+Native ORC Vectorized 11496 11534 67 1.4 730.9 1.0X
+Native ORC Vectorized (Pushdown) 11211 11250 33 1.4 712.8 1.1X
================================================================================================
Pushdown benchmark for InSet -> InFilters
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 5, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6541 6622 78 2.4 415.9 1.0X
-Parquet Vectorized (Pushdown) 396 432 41 39.7 25.2 16.5X
-Native ORC Vectorized 4724 4750 20 3.3 300.3 1.4X
-Native ORC Vectorized (Pushdown) 325 350 29 48.4 20.7 20.1X
+Parquet Vectorized 6234 6271 28 2.5 396.3 1.0X
+Parquet Vectorized (Pushdown) 297 317 16 52.9 18.9 21.0X
+Native ORC Vectorized 4805 4847 38 3.3 305.5 1.3X
+Native ORC Vectorized (Pushdown) 315 320 5 49.9 20.0 19.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 5, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6231 6249 17 2.5 396.2 1.0X
-Parquet Vectorized (Pushdown) 303 316 8 51.9 19.3 20.6X
-Native ORC Vectorized 4716 4729 12 3.3 299.8 1.3X
-Native ORC Vectorized (Pushdown) 296 307 6 53.1 18.8 21.0X
+Parquet Vectorized 6125 6153 29 2.6 389.4 1.0X
+Parquet Vectorized (Pushdown) 283 289 3 55.6 18.0 21.6X
+Native ORC Vectorized 4766 4789 19 3.3 303.0 1.3X
+Native ORC Vectorized (Pushdown) 296 306 10 53.2 18.8 20.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 5, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6193 6206 14 2.5 393.7 1.0X
-Parquet Vectorized (Pushdown) 299 304 4 52.6 19.0 20.7X
-Native ORC Vectorized 4700 4736 32 3.3 298.8 1.3X
-Native ORC Vectorized (Pushdown) 292 309 19 53.9 18.5 21.2X
+Parquet Vectorized 6131 6144 19 2.6 389.8 1.0X
+Parquet Vectorized (Pushdown) 285 291 4 55.2 18.1 21.5X
+Native ORC Vectorized 4765 4783 14 3.3 302.9 1.3X
+Native ORC Vectorized (Pushdown) 298 302 3 52.9 18.9 20.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 10, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6192 6229 26 2.5 393.7 1.0X
-Parquet Vectorized (Pushdown) 314 347 63 50.1 20.0 19.7X
-Native ORC Vectorized 4746 4757 23 3.3 301.7 1.3X
-Native ORC Vectorized (Pushdown) 307 315 6 51.2 19.5 20.2X
+Parquet Vectorized 6124 6142 15 2.6 389.3 1.0X
+Parquet Vectorized (Pushdown) 300 304 3 52.5 19.1 20.4X
+Native ORC Vectorized 4780 4786 9 3.3 303.9 1.3X
+Native ORC Vectorized (Pushdown) 310 315 3 50.7 19.7 19.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 10, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6195 6204 9 2.5 393.9 1.0X
-Parquet Vectorized (Pushdown) 318 323 6 49.5 20.2 19.5X
-Native ORC Vectorized 4724 4790 96 3.3 300.4 1.3X
-Native ORC Vectorized (Pushdown) 305 311 8 51.5 19.4 20.3X
+Parquet Vectorized 6146 6183 36 2.6 390.8 1.0X
+Parquet Vectorized (Pushdown) 298 302 3 52.8 18.9 20.6X
+Native ORC Vectorized 4768 4790 15 3.3 303.1 1.3X
+Native ORC Vectorized (Pushdown) 308 313 2 51.0 19.6 19.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 10, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6215 6232 16 2.5 395.1 1.0X
-Parquet Vectorized (Pushdown) 310 317 7 50.7 19.7 20.0X
-Native ORC Vectorized 4738 4748 14 3.3 301.2 1.3X
-Native ORC Vectorized (Pushdown) 304 310 8 51.7 19.4 20.4X
+Parquet Vectorized 6120 6151 29 2.6 389.1 1.0X
+Parquet Vectorized (Pushdown) 297 302 4 52.9 18.9 20.6X
+Native ORC Vectorized 4746 4767 14 3.3 301.7 1.3X
+Native ORC Vectorized (Pushdown) 308 314 5 51.0 19.6 19.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 50, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6390 6421 23 2.5 406.3 1.0X
-Parquet Vectorized (Pushdown) 892 901 9 17.6 56.7 7.2X
-Native ORC Vectorized 4915 4928 12 3.2 312.5 1.3X
-Native ORC Vectorized (Pushdown) 413 421 7 38.1 26.2 15.5X
+Parquet Vectorized 6324 6337 15 2.5 402.1 1.0X
+Parquet Vectorized (Pushdown) 880 886 4 17.9 56.0 7.2X
+Native ORC Vectorized 4958 4972 10 3.2 315.2 1.3X
+Native ORC Vectorized (Pushdown) 412 416 2 38.2 26.2 15.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 50, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6392 6396 4 2.5 406.4 1.0X
-Parquet Vectorized (Pushdown) 3302 3315 10 4.8 209.9 1.9X
-Native ORC Vectorized 4916 4925 7 3.2 312.6 1.3X
-Native ORC Vectorized (Pushdown) 431 433 2 36.5 27.4 14.8X
+Parquet Vectorized 6319 6338 18 2.5 401.8 1.0X
+Parquet Vectorized (Pushdown) 3192 3199 8 4.9 202.9 2.0X
+Native ORC Vectorized 4954 4981 18 3.2 315.0 1.3X
+Native ORC Vectorized (Pushdown) 422 429 5 37.3 26.8 15.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 50, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6384 6399 11 2.5 405.9 1.0X
-Parquet Vectorized (Pushdown) 5735 5748 10 2.7 364.6 1.1X
-Native ORC Vectorized 4930 4937 6 3.2 313.5 1.3X
-Native ORC Vectorized (Pushdown) 425 429 3 37.0 27.0 15.0X
+Parquet Vectorized 6314 6337 18 2.5 401.4 1.0X
+Parquet Vectorized (Pushdown) 5356 5400 29 2.9 340.5 1.2X
+Native ORC Vectorized 4983 4994 17 3.2 316.8 1.3X
+Native ORC Vectorized (Pushdown) 438 444 3 35.9 27.9 14.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 100, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6355 6365 12 2.5 404.1 1.0X
-Parquet Vectorized (Pushdown) 879 883 4 17.9 55.9 7.2X
-Native ORC Vectorized 4881 4894 16 3.2 310.3 1.3X
-Native ORC Vectorized (Pushdown) 504 508 5 31.2 32.0 12.6X
+Parquet Vectorized 6330 6336 7 2.5 402.4 1.0X
+Parquet Vectorized (Pushdown) 874 879 4 18.0 55.6 7.2X
+Native ORC Vectorized 4910 4938 19 3.2 312.2 1.3X
+Native ORC Vectorized (Pushdown) 506 507 1 31.1 32.1 12.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 100, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6342 6360 16 2.5 403.2 1.0X
-Parquet Vectorized (Pushdown) 3308 3329 22 4.8 210.3 1.9X
-Native ORC Vectorized 4865 4886 16 3.2 309.3 1.3X
-Native ORC Vectorized (Pushdown) 550 552 2 28.6 34.9 11.5X
+Parquet Vectorized 6330 6338 7 2.5 402.4 1.0X
+Parquet Vectorized (Pushdown) 3244 3255 11 4.8 206.3 2.0X
+Native ORC Vectorized 4919 4939 14 3.2 312.8 1.3X
+Native ORC Vectorized (Pushdown) 579 588 11 27.2 36.8 10.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 100, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6352 6364 12 2.5 403.8 1.0X
-Parquet Vectorized (Pushdown) 5622 5644 25 2.8 357.4 1.1X
-Native ORC Vectorized 4888 4898 11 3.2 310.8 1.3X
-Native ORC Vectorized (Pushdown) 576 581 4 27.3 36.6 11.0X
+Parquet Vectorized 6332 6358 19 2.5 402.6 1.0X
+Parquet Vectorized (Pushdown) 5562 5579 21 2.8 353.6 1.1X
+Native ORC Vectorized 4927 4946 16 3.2 313.2 1.3X
+Native ORC Vectorized (Pushdown) 591 593 1 26.6 37.6 10.7X
================================================================================================
Pushdown benchmark for tinyint
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 tinyint row (value = CAST(63 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 2796 2818 23 5.6 177.8 1.0X
-Parquet Vectorized (Pushdown) 111 127 17 141.6 7.1 25.2X
-Native ORC Vectorized 2199 2223 17 7.2 139.8 1.3X
-Native ORC Vectorized (Pushdown) 118 135 16 133.8 7.5 23.8X
+Parquet Vectorized 2632 2651 13 6.0 167.3 1.0X
+Parquet Vectorized (Pushdown) 105 121 17 150.3 6.7 25.2X
+Native ORC Vectorized 2183 2201 13 7.2 138.8 1.2X
+Native ORC Vectorized (Pushdown) 120 138 20 130.8 7.6 21.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% tinyint rows (value < CAST(12 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3387 3439 50 4.6 215.3 1.0X
-Parquet Vectorized (Pushdown) 995 1014 14 15.8 63.3 3.4X
-Native ORC Vectorized 2750 2769 15 5.7 174.8 1.2X
-Native ORC Vectorized (Pushdown) 888 909 26 17.7 56.5 3.8X
+Parquet Vectorized 3288 3347 55 4.8 209.1 1.0X
+Parquet Vectorized (Pushdown) 953 967 13 16.5 60.6 3.5X
+Native ORC Vectorized 2820 2827 7 5.6 179.3 1.2X
+Native ORC Vectorized (Pushdown) 937 942 3 16.8 59.6 3.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% tinyint rows (value < CAST(63 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6036 6059 24 2.6 383.8 1.0X
-Parquet Vectorized (Pushdown) 4750 4767 14 3.3 302.0 1.3X
-Native ORC Vectorized 5234 5255 18 3.0 332.8 1.2X
-Native ORC Vectorized (Pushdown) 4180 4191 19 3.8 265.8 1.4X
+Parquet Vectorized 5802 5841 53 2.7 368.9 1.0X
+Parquet Vectorized (Pushdown) 4542 4559 16 3.5 288.8 1.3X
+Native ORC Vectorized 5429 5445 11 2.9 345.2 1.1X
+Native ORC Vectorized (Pushdown) 4359 4373 12 3.6 277.1 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% tinyint rows (value < CAST(114 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 8795 8807 11 1.8 559.2 1.0X
-Parquet Vectorized (Pushdown) 8512 8539 23 1.8 541.2 1.0X
-Native ORC Vectorized 7798 7816 20 2.0 495.8 1.1X
-Native ORC Vectorized (Pushdown) 7622 7649 44 2.1 484.6 1.2X
+Parquet Vectorized 8235 8274 39 1.9 523.6 1.0X
+Parquet Vectorized (Pushdown) 8031 8051 16 2.0 510.6 1.0X
+Native ORC Vectorized 8040 8056 13 2.0 511.2 1.0X
+Native ORC Vectorized (Pushdown) 7876 7882 9 2.0 500.7 1.0X
================================================================================================
Pushdown benchmark for Timestamp
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 timestamp stored as INT96 row (value = timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3139 3152 11 5.0 199.6 1.0X
-Parquet Vectorized (Pushdown) 3143 3149 8 5.0 199.8 1.0X
-Native ORC Vectorized 2025 2035 10 7.8 128.8 1.6X
-Native ORC Vectorized (Pushdown) 40 44 5 390.9 2.6 78.0X
+Parquet Vectorized 3011 3017 4 5.2 191.4 1.0X
+Parquet Vectorized (Pushdown) 3012 3030 27 5.2 191.5 1.0X
+Native ORC Vectorized 2018 2032 11 7.8 128.3 1.5X
+Native ORC Vectorized (Pushdown) 43 47 5 369.2 2.7 70.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% timestamp stored as INT96 rows (value < timestamp_seconds(1572864)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3808 3822 16 4.1 242.1 1.0X
-Parquet Vectorized (Pushdown) 3800 3809 10 4.1 241.6 1.0X
-Native ORC Vectorized 2667 2681 19 5.9 169.6 1.4X
-Native ORC Vectorized (Pushdown) 879 885 5 17.9 55.9 4.3X
+Parquet Vectorized 3674 3710 49 4.3 233.6 1.0X
+Parquet Vectorized (Pushdown) 3683 3694 10 4.3 234.2 1.0X
+Native ORC Vectorized 2722 2740 19 5.8 173.1 1.3X
+Native ORC Vectorized (Pushdown) 942 946 4 16.7 59.9 3.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% timestamp stored as INT96 rows (value < timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6618 6632 11 2.4 420.8 1.0X
-Parquet Vectorized (Pushdown) 6637 6645 11 2.4 422.0 1.0X
-Native ORC Vectorized 5201 5215 18 3.0 330.7 1.3X
-Native ORC Vectorized (Pushdown) 4180 4189 6 3.8 265.8 1.6X
+Parquet Vectorized 6337 6368 20 2.5 402.9 1.0X
+Parquet Vectorized (Pushdown) 6358 6376 21 2.5 404.2 1.0X
+Native ORC Vectorized 5698 5721 15 2.8 362.3 1.1X
+Native ORC Vectorized (Pushdown) 4688 4703 13 3.4 298.0 1.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% timestamp stored as INT96 rows (value < timestamp_seconds(14155776)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9362 9370 12 1.7 595.2 1.0X
-Parquet Vectorized (Pushdown) 9129 9137 14 1.7 580.4 1.0X
-Native ORC Vectorized 7670 7713 43 2.1 487.6 1.2X
-Native ORC Vectorized (Pushdown) 7481 7505 33 2.1 475.6 1.3X
+Parquet Vectorized 8881 8914 29 1.8 564.6 1.0X
+Parquet Vectorized (Pushdown) 8916 8933 13 1.8 566.8 1.0X
+Native ORC Vectorized 8438 8454 13 1.9 536.5 1.1X
+Native ORC Vectorized (Pushdown) 8251 8265 9 1.9 524.6 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 timestamp stored as TIMESTAMP_MICROS row (value = timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 2609 2626 22 6.0 165.9 1.0X
-Parquet Vectorized (Pushdown) 71 74 4 222.2 4.5 36.8X
-Native ORC Vectorized 2015 2029 14 7.8 128.1 1.3X
-Native ORC Vectorized (Pushdown) 40 43 4 397.2 2.5 65.9X
+Parquet Vectorized 2497 2508 10 6.3 158.8 1.0X
+Parquet Vectorized (Pushdown) 69 73 4 227.6 4.4 36.1X
+Native ORC Vectorized 2011 2015 5 7.8 127.9 1.2X
+Native ORC Vectorized (Pushdown) 42 44 3 377.1 2.7 59.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% timestamp stored as TIMESTAMP_MICROS rows (value < timestamp_seconds(1572864)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3242 3252 9 4.9 206.1 1.0X
-Parquet Vectorized (Pushdown) 974 978 3 16.1 61.9 3.3X
-Native ORC Vectorized 2641 2650 6 6.0 167.9 1.2X
-Native ORC Vectorized (Pushdown) 867 868 1 18.2 55.1 3.7X
+Parquet Vectorized 3141 3146 6 5.0 199.7 1.0X
+Parquet Vectorized (Pushdown) 976 978 1 16.1 62.1 3.2X
+Native ORC Vectorized 2741 2747 5 5.7 174.3 1.1X
+Native ORC Vectorized (Pushdown) 940 944 2 16.7 59.8 3.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% timestamp stored as TIMESTAMP_MICROS rows (value < timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5990 6015 19 2.6 380.9 1.0X
-Parquet Vectorized (Pushdown) 4747 4810 61 3.3 301.8 1.3X
-Native ORC Vectorized 5172 5193 15 3.0 328.8 1.2X
-Native ORC Vectorized (Pushdown) 4160 4166 5 3.8 264.5 1.4X
+Parquet Vectorized 5793 5833 45 2.7 368.3 1.0X
+Parquet Vectorized (Pushdown) 4601 4617 15 3.4 292.6 1.3X
+Native ORC Vectorized 5587 5601 18 2.8 355.2 1.0X
+Native ORC Vectorized (Pushdown) 4537 4551 11 3.5 288.4 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% timestamp stored as TIMESTAMP_MICROS rows (value < timestamp_seconds(14155776)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 8667 8710 31 1.8 551.1 1.0X
-Parquet Vectorized (Pushdown) 8479 8484 5 1.9 539.1 1.0X
-Native ORC Vectorized 7685 7720 37 2.0 488.6 1.1X
-Native ORC Vectorized (Pushdown) 7487 7530 50 2.1 476.0 1.2X
+Parquet Vectorized 8361 8369 8 1.9 531.6 1.0X
+Parquet Vectorized (Pushdown) 8155 8177 14 1.9 518.5 1.0X
+Native ORC Vectorized 8452 8461 12 1.9 537.3 1.0X
+Native ORC Vectorized (Pushdown) 8246 8267 14 1.9 524.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 timestamp stored as TIMESTAMP_MILLIS row (value = timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 2770 2777 5 5.7 176.1 1.0X
-Parquet Vectorized (Pushdown) 71 73 3 222.8 4.5 39.2X
-Native ORC Vectorized 2025 2036 11 7.8 128.7 1.4X
-Native ORC Vectorized (Pushdown) 40 44 4 394.9 2.5 69.5X
+Parquet Vectorized 2660 2661 2 5.9 169.1 1.0X
+Parquet Vectorized (Pushdown) 68 71 4 231.8 4.3 39.2X
+Native ORC Vectorized 2019 2023 6 7.8 128.3 1.3X
+Native ORC Vectorized (Pushdown) 41 44 4 380.7 2.6 64.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% timestamp stored as TIMESTAMP_MILLIS rows (value < timestamp_seconds(1572864)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3428 3447 28 4.6 218.0 1.0X
-Parquet Vectorized (Pushdown) 1006 1011 4 15.6 64.0 3.4X
-Native ORC Vectorized 2667 2677 8 5.9 169.6 1.3X
-Native ORC Vectorized (Pushdown) 876 881 3 17.9 55.7 3.9X
+Parquet Vectorized 3312 3326 15 4.7 210.6 1.0X
+Parquet Vectorized (Pushdown) 991 994 4 15.9 63.0 3.3X
+Native ORC Vectorized 2738 2749 8 5.7 174.1 1.2X
+Native ORC Vectorized (Pushdown) 941 944 3 16.7 59.8 3.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% timestamp stored as TIMESTAMP_MILLIS rows (value < timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6140 6151 9 2.6 390.4 1.0X
-Parquet Vectorized (Pushdown) 4807 4813 5 3.3 305.6 1.3X
-Native ORC Vectorized 5154 5162 8 3.1 327.7 1.2X
-Native ORC Vectorized (Pushdown) 4122 4131 10 3.8 262.0 1.5X
+Parquet Vectorized 5947 5965 18 2.6 378.1 1.0X
+Parquet Vectorized (Pushdown) 4690 4707 14 3.4 298.2 1.3X
+Native ORC Vectorized 5579 5591 11 2.8 354.7 1.1X
+Native ORC Vectorized (Pushdown) 4552 4567 13 3.5 289.4 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% timestamp stored as TIMESTAMP_MILLIS rows (value < timestamp_seconds(14155776)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 8880 8900 13 1.8 564.6 1.0X
-Parquet Vectorized (Pushdown) 8616 8629 14 1.8 547.8 1.0X
-Native ORC Vectorized 7696 7735 46 2.0 489.3 1.2X
-Native ORC Vectorized (Pushdown) 7497 7510 9 2.1 476.7 1.2X
+Parquet Vectorized 8541 8556 11 1.8 543.0 1.0X
+Parquet Vectorized (Pushdown) 8321 8341 21 1.9 529.0 1.0X
+Native ORC Vectorized 8434 8456 20 1.9 536.2 1.0X
+Native ORC Vectorized (Pushdown) 8261 8268 12 1.9 525.2 1.0X
================================================================================================
Pushdown benchmark with many filters
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 row with 1 filters: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 51 75 17 0.0 51336693.0 1.0X
-Parquet Vectorized (Pushdown) 52 54 3 0.0 51779493.0 1.0X
-Native ORC Vectorized 45 46 2 0.0 44817022.0 1.1X
-Native ORC Vectorized (Pushdown) 47 51 5 0.0 46799315.0 1.1X
+Parquet Vectorized 47 54 10 0.0 47073806.0 1.0X
+Parquet Vectorized (Pushdown) 48 51 3 0.0 48254597.0 1.0X
+Native ORC Vectorized 43 46 5 0.0 42518323.0 1.1X
+Native ORC Vectorized (Pushdown) 44 47 3 0.0 44456944.0 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 row with 250 filters: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 170 181 9 0.0 170098519.0 1.0X
-Parquet Vectorized (Pushdown) 177 183 5 0.0 176637480.0 1.0X
-Native ORC Vectorized 166 169 3 0.0 165753639.0 1.0X
-Native ORC Vectorized (Pushdown) 167 173 5 0.0 167076087.0 1.0X
+Parquet Vectorized 170 178 7 0.0 170168877.0 1.0X
+Parquet Vectorized (Pushdown) 173 180 7 0.0 173290596.0 1.0X
+Native ORC Vectorized 165 173 6 0.0 164773308.0 1.0X
+Native ORC Vectorized (Pushdown) 165 171 5 0.0 165283905.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 row with 500 filters: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 510 530 18 0.0 510147157.0 1.0X
-Parquet Vectorized (Pushdown) 518 539 19 0.0 517520226.0 1.0X
-Native ORC Vectorized 502 510 9 0.0 502346348.0 1.0X
-Native ORC Vectorized (Pushdown) 514 530 17 0.0 513941675.0 1.0X
+Parquet Vectorized 525 535 13 0.0 524597822.0 1.0X
+Parquet Vectorized (Pushdown) 535 552 16 0.0 534526800.0 1.0X
+Native ORC Vectorized 519 528 8 0.0 519431475.0 1.0X
+Native ORC Vectorized (Pushdown) 525 538 14 0.0 525191651.0 1.0X
diff --git a/sql/core/benchmarks/FilterPushdownBenchmark-results.txt b/sql/core/benchmarks/FilterPushdownBenchmark-results.txt
index 89eb049c3a0fa..a672109ce5844 100644
--- a/sql/core/benchmarks/FilterPushdownBenchmark-results.txt
+++ b/sql/core/benchmarks/FilterPushdownBenchmark-results.txt
@@ -2,733 +2,733 @@
Pushdown for many distinct value case
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 string row (value IS NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6856 6933 83 2.3 435.9 1.0X
-Parquet Vectorized (Pushdown) 331 338 7 47.5 21.0 20.7X
-Native ORC Vectorized 5021 5090 53 3.1 319.3 1.4X
-Native ORC Vectorized (Pushdown) 303 317 11 52.0 19.2 22.7X
+Parquet Vectorized 6883 6923 37 2.3 437.6 1.0X
+Parquet Vectorized (Pushdown) 335 349 11 46.9 21.3 20.5X
+Native ORC Vectorized 5462 5502 36 2.9 347.3 1.3X
+Native ORC Vectorized (Pushdown) 320 337 11 49.2 20.3 21.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 string row ('7864320' < value < '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6956 6978 20 2.3 442.2 1.0X
-Parquet Vectorized (Pushdown) 319 334 17 49.3 20.3 21.8X
-Native ORC Vectorized 5161 5171 11 3.0 328.1 1.3X
-Native ORC Vectorized (Pushdown) 310 326 18 50.8 19.7 22.5X
+Parquet Vectorized 6943 6965 22 2.3 441.4 1.0X
+Parquet Vectorized (Pushdown) 335 359 18 46.9 21.3 20.7X
+Native ORC Vectorized 5559 5582 17 2.8 353.4 1.2X
+Native ORC Vectorized (Pushdown) 327 335 6 48.1 20.8 21.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 string row (value = '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6911 6952 39 2.3 439.4 1.0X
-Parquet Vectorized (Pushdown) 302 313 10 52.2 19.2 22.9X
-Native ORC Vectorized 5121 5145 23 3.1 325.6 1.3X
-Native ORC Vectorized (Pushdown) 295 303 7 53.3 18.8 23.4X
+Parquet Vectorized 6928 6941 14 2.3 440.4 1.0X
+Parquet Vectorized (Pushdown) 317 327 7 49.6 20.1 21.9X
+Native ORC Vectorized 5571 5591 26 2.8 354.2 1.2X
+Native ORC Vectorized (Pushdown) 313 320 9 50.3 19.9 22.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 string row (value <=> '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6908 6916 8 2.3 439.2 1.0X
-Parquet Vectorized (Pushdown) 293 306 11 53.7 18.6 23.6X
-Native ORC Vectorized 5113 5133 16 3.1 325.1 1.4X
-Native ORC Vectorized (Pushdown) 289 295 3 54.4 18.4 23.9X
+Parquet Vectorized 6899 6914 12 2.3 438.6 1.0X
+Parquet Vectorized (Pushdown) 310 327 15 50.8 19.7 22.3X
+Native ORC Vectorized 5547 5557 6 2.8 352.7 1.2X
+Native ORC Vectorized (Pushdown) 303 309 4 51.9 19.3 22.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 string row ('7864320' <= value <= '7864320'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6953 6979 24 2.3 442.1 1.0X
-Parquet Vectorized (Pushdown) 300 305 6 52.4 19.1 23.1X
-Native ORC Vectorized 5147 5175 25 3.1 327.2 1.4X
-Native ORC Vectorized (Pushdown) 296 303 7 53.1 18.8 23.5X
+Parquet Vectorized 6944 6971 41 2.3 441.5 1.0X
+Parquet Vectorized (Pushdown) 309 320 11 50.8 19.7 22.4X
+Native ORC Vectorized 5534 5554 22 2.8 351.8 1.3X
+Native ORC Vectorized (Pushdown) 307 326 16 51.2 19.5 22.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all string rows (value IS NOT NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 14342 14384 46 1.1 911.9 1.0X
-Parquet Vectorized (Pushdown) 14364 14404 29 1.1 913.2 1.0X
-Native ORC Vectorized 12523 12580 38 1.3 796.2 1.1X
-Native ORC Vectorized (Pushdown) 12619 12644 24 1.2 802.3 1.1X
+Parquet Vectorized 14452 14519 48 1.1 918.9 1.0X
+Parquet Vectorized (Pushdown) 14521 14546 19 1.1 923.2 1.0X
+Native ORC Vectorized 13001 13039 35 1.2 826.6 1.1X
+Native ORC Vectorized (Pushdown) 13112 13137 36 1.2 833.6 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 int row (value IS NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6539 6556 14 2.4 415.7 1.0X
-Parquet Vectorized (Pushdown) 274 280 6 57.5 17.4 23.9X
-Native ORC Vectorized 4657 4676 14 3.4 296.1 1.4X
-Native ORC Vectorized (Pushdown) 277 281 5 56.8 17.6 23.6X
+Parquet Vectorized 6546 6562 15 2.4 416.2 1.0X
+Parquet Vectorized (Pushdown) 292 301 7 53.8 18.6 22.4X
+Native ORC Vectorized 5044 5050 7 3.1 320.7 1.3X
+Native ORC Vectorized (Pushdown) 288 297 5 54.6 18.3 22.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 int row (7864320 < value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6488 6520 39 2.4 412.5 1.0X
-Parquet Vectorized (Pushdown) 279 287 5 56.3 17.8 23.2X
-Native ORC Vectorized 4664 4677 13 3.4 296.5 1.4X
-Native ORC Vectorized (Pushdown) 282 287 4 55.8 17.9 23.0X
+Parquet Vectorized 6530 6539 12 2.4 415.2 1.0X
+Parquet Vectorized (Pushdown) 301 306 4 52.2 19.1 21.7X
+Native ORC Vectorized 5040 5057 15 3.1 320.4 1.3X
+Native ORC Vectorized (Pushdown) 294 304 11 53.5 18.7 22.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6538 6546 7 2.4 415.7 1.0X
-Parquet Vectorized (Pushdown) 278 283 5 56.6 17.7 23.5X
-Native ORC Vectorized 4742 4764 20 3.3 301.5 1.4X
-Native ORC Vectorized (Pushdown) 282 288 7 55.8 17.9 23.2X
+Parquet Vectorized 6543 6555 17 2.4 416.0 1.0X
+Parquet Vectorized (Pushdown) 298 305 7 52.8 18.9 22.0X
+Native ORC Vectorized 5084 5093 6 3.1 323.2 1.3X
+Native ORC Vectorized (Pushdown) 290 298 10 54.2 18.5 22.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (value <=> 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6544 6573 21 2.4 416.0 1.0X
-Parquet Vectorized (Pushdown) 276 286 7 56.9 17.6 23.7X
-Native ORC Vectorized 4709 4749 56 3.3 299.4 1.4X
-Native ORC Vectorized (Pushdown) 276 283 4 57.1 17.5 23.7X
+Parquet Vectorized 6550 6583 46 2.4 416.5 1.0X
+Parquet Vectorized (Pushdown) 293 298 3 53.6 18.6 22.3X
+Native ORC Vectorized 5081 5093 12 3.1 323.0 1.3X
+Native ORC Vectorized (Pushdown) 285 298 12 55.2 18.1 23.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (7864320 <= value <= 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6532 6545 8 2.4 415.3 1.0X
-Parquet Vectorized (Pushdown) 277 279 2 56.8 17.6 23.6X
-Native ORC Vectorized 4704 4731 28 3.3 299.0 1.4X
-Native ORC Vectorized (Pushdown) 282 287 4 55.8 17.9 23.2X
+Parquet Vectorized 6546 6574 17 2.4 416.2 1.0X
+Parquet Vectorized (Pushdown) 297 302 3 52.9 18.9 22.0X
+Native ORC Vectorized 5072 5079 4 3.1 322.5 1.3X
+Native ORC Vectorized (Pushdown) 289 296 6 54.4 18.4 22.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 int row (7864319 < value < 7864321): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6538 6558 23 2.4 415.7 1.0X
-Parquet Vectorized (Pushdown) 275 287 10 57.2 17.5 23.8X
-Native ORC Vectorized 4723 4749 25 3.3 300.3 1.4X
-Native ORC Vectorized (Pushdown) 278 282 3 56.6 17.7 23.5X
+Parquet Vectorized 6535 6575 43 2.4 415.5 1.0X
+Parquet Vectorized (Pushdown) 295 299 3 53.4 18.7 22.2X
+Native ORC Vectorized 5070 5074 2 3.1 322.3 1.3X
+Native ORC Vectorized (Pushdown) 289 294 3 54.4 18.4 22.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% int rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 7258 7290 37 2.2 461.5 1.0X
-Parquet Vectorized (Pushdown) 1623 1633 8 9.7 103.2 4.5X
-Native ORC Vectorized 5374 5380 5 2.9 341.6 1.4X
-Native ORC Vectorized (Pushdown) 1414 1420 6 11.1 89.9 5.1X
+Parquet Vectorized 7234 7253 18 2.2 459.9 1.0X
+Parquet Vectorized (Pushdown) 1629 1633 5 9.7 103.6 4.4X
+Native ORC Vectorized 5766 5771 5 2.7 366.6 1.3X
+Native ORC Vectorized (Pushdown) 1467 1471 4 10.7 93.3 4.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% int rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 10004 10038 29 1.6 636.0 1.0X
-Parquet Vectorized (Pushdown) 6892 6906 11 2.3 438.2 1.5X
-Native ORC Vectorized 8061 8078 15 2.0 512.5 1.2X
-Native ORC Vectorized (Pushdown) 5897 5910 12 2.7 374.9 1.7X
+Parquet Vectorized 9845 9864 22 1.6 626.0 1.0X
+Parquet Vectorized (Pushdown) 6755 6762 11 2.3 429.5 1.5X
+Native ORC Vectorized 8373 8380 8 1.9 532.4 1.2X
+Native ORC Vectorized (Pushdown) 6027 6041 15 2.6 383.2 1.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% int rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 12533 12571 35 1.3 796.9 1.0X
-Parquet Vectorized (Pushdown) 11864 11902 33 1.3 754.3 1.1X
-Native ORC Vectorized 10727 10812 85 1.5 682.0 1.2X
-Native ORC Vectorized (Pushdown) 10366 10408 35 1.5 659.1 1.2X
+Parquet Vectorized 12382 12396 13 1.3 787.2 1.0X
+Parquet Vectorized (Pushdown) 11785 11802 11 1.3 749.3 1.1X
+Native ORC Vectorized 10944 10975 25 1.4 695.8 1.1X
+Native ORC Vectorized (Pushdown) 10555 10561 9 1.5 671.1 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all int rows (value IS NOT NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 13484 13490 7 1.2 857.3 1.0X
-Parquet Vectorized (Pushdown) 13500 13533 22 1.2 858.3 1.0X
-Native ORC Vectorized 11483 11532 39 1.4 730.0 1.2X
-Native ORC Vectorized (Pushdown) 11477 11592 107 1.4 729.7 1.2X
+Parquet Vectorized 13150 13174 22 1.2 836.1 1.0X
+Parquet Vectorized (Pushdown) 13194 13220 20 1.2 838.9 1.0X
+Native ORC Vectorized 11537 11552 14 1.4 733.5 1.1X
+Native ORC Vectorized (Pushdown) 11622 11639 15 1.4 738.9 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all int rows (value > -1): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 13032 13061 20 1.2 828.6 1.0X
-Parquet Vectorized (Pushdown) 13076 13100 19 1.2 831.4 1.0X
-Native ORC Vectorized 11456 11486 47 1.4 728.3 1.1X
-Native ORC Vectorized (Pushdown) 11538 11569 25 1.4 733.5 1.1X
+Parquet Vectorized 13086 13099 11 1.2 832.0 1.0X
+Parquet Vectorized (Pushdown) 13137 13156 15 1.2 835.2 1.0X
+Native ORC Vectorized 11614 11630 20 1.4 738.4 1.1X
+Native ORC Vectorized (Pushdown) 11685 11702 18 1.3 742.9 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all int rows (value != -1): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 13201 13227 23 1.2 839.3 1.0X
-Parquet Vectorized (Pushdown) 13322 13336 24 1.2 847.0 1.0X
-Native ORC Vectorized 11276 11304 19 1.4 716.9 1.2X
-Native ORC Vectorized (Pushdown) 11397 11430 41 1.4 724.6 1.2X
+Parquet Vectorized 13062 13077 11 1.2 830.5 1.0X
+Parquet Vectorized (Pushdown) 13127 13151 27 1.2 834.6 1.0X
+Native ORC Vectorized 11692 11786 192 1.3 743.4 1.1X
+Native ORC Vectorized (Pushdown) 11803 11846 41 1.3 750.4 1.1X
================================================================================================
Pushdown for few distinct value case (use dictionary encoding)
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 distinct string row (value IS NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5934 5955 21 2.7 377.3 1.0X
-Parquet Vectorized (Pushdown) 240 249 10 65.6 15.3 24.7X
-Native ORC Vectorized 6197 6233 41 2.5 394.0 1.0X
-Native ORC Vectorized (Pushdown) 924 937 9 17.0 58.8 6.4X
+Parquet Vectorized 5890 5919 34 2.7 374.5 1.0X
+Parquet Vectorized (Pushdown) 240 244 3 65.5 15.3 24.5X
+Native ORC Vectorized 6629 6641 12 2.4 421.5 0.9X
+Native ORC Vectorized (Pushdown) 952 962 8 16.5 60.5 6.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 0 distinct string row ('100' < value < '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6043 6055 9 2.6 384.2 1.0X
-Parquet Vectorized (Pushdown) 243 248 6 64.8 15.4 24.9X
-Native ORC Vectorized 6428 6455 19 2.4 408.7 0.9X
-Native ORC Vectorized (Pushdown) 930 938 7 16.9 59.1 6.5X
+Parquet Vectorized 6043 6053 11 2.6 384.2 1.0X
+Parquet Vectorized (Pushdown) 242 245 2 64.9 15.4 24.9X
+Native ORC Vectorized 6856 6867 8 2.3 435.9 0.9X
+Native ORC Vectorized (Pushdown) 960 967 5 16.4 61.1 6.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 distinct string row (value = '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5954 5969 13 2.6 378.5 1.0X
-Parquet Vectorized (Pushdown) 290 294 3 54.3 18.4 20.6X
-Native ORC Vectorized 6362 6379 14 2.5 404.5 0.9X
-Native ORC Vectorized (Pushdown) 957 975 18 16.4 60.9 6.2X
+Parquet Vectorized 5951 5984 19 2.6 378.4 1.0X
+Parquet Vectorized (Pushdown) 292 296 4 53.8 18.6 20.4X
+Native ORC Vectorized 6823 7080 199 2.3 433.8 0.9X
+Native ORC Vectorized (Pushdown) 1008 1042 26 15.6 64.1 5.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 distinct string row (value <=> '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5962 5984 24 2.6 379.0 1.0X
-Parquet Vectorized (Pushdown) 289 295 7 54.4 18.4 20.6X
-Native ORC Vectorized 6353 6382 17 2.5 403.9 0.9X
-Native ORC Vectorized (Pushdown) 952 963 13 16.5 60.5 6.3X
+Parquet Vectorized 5941 5958 11 2.6 377.7 1.0X
+Parquet Vectorized (Pushdown) 292 296 4 53.9 18.5 20.4X
+Native ORC Vectorized 6766 7201 429 2.3 430.2 0.9X
+Native ORC Vectorized (Pushdown) 1333 1380 41 11.8 84.7 4.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 distinct string row ('100' <= value <= '100'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6008 6017 8 2.6 382.0 1.0X
-Parquet Vectorized (Pushdown) 290 297 5 54.2 18.5 20.7X
-Native ORC Vectorized 6437 6457 17 2.4 409.3 0.9X
-Native ORC Vectorized (Pushdown) 972 975 2 16.2 61.8 6.2X
+Parquet Vectorized 6076 6112 22 2.6 386.3 1.0X
+Parquet Vectorized (Pushdown) 301 312 8 52.3 19.1 20.2X
+Native ORC Vectorized 8039 8099 56 2.0 511.1 0.8X
+Native ORC Vectorized (Pushdown) 1339 1380 50 11.7 85.2 4.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select all distinct string rows (value IS NOT NULL): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 14051 14073 29 1.1 893.3 1.0X
-Parquet Vectorized (Pushdown) 14119 14153 26 1.1 897.7 1.0X
-Native ORC Vectorized 14169 14225 54 1.1 900.8 1.0X
-Native ORC Vectorized (Pushdown) 14404 14427 28 1.1 915.8 1.0X
+Parquet Vectorized 14721 14761 24 1.1 935.9 1.0X
+Parquet Vectorized (Pushdown) 14796 14846 70 1.1 940.7 1.0X
+Native ORC Vectorized 16834 17184 208 0.9 1070.3 0.9X
+Native ORC Vectorized (Pushdown) 17994 18093 111 0.9 1144.0 0.8X
================================================================================================
Pushdown benchmark for StringStartsWith
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringStartsWith filter: (value like '10%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 7175 7182 6 2.2 456.2 1.0X
-Parquet Vectorized (Pushdown) 944 950 7 16.7 60.0 7.6X
-Native ORC Vectorized 5261 5285 15 3.0 334.5 1.4X
-Native ORC Vectorized (Pushdown) 5356 5363 11 2.9 340.5 1.3X
+Parquet Vectorized 7173 7238 68 2.2 456.1 1.0X
+Parquet Vectorized (Pushdown) 942 946 3 16.7 59.9 7.6X
+Native ORC Vectorized 5658 5672 9 2.8 359.7 1.3X
+Native ORC Vectorized (Pushdown) 5758 5774 20 2.7 366.1 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringStartsWith filter: (value like '1000%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6984 6993 10 2.3 444.1 1.0X
-Parquet Vectorized (Pushdown) 277 284 5 56.8 17.6 25.2X
-Native ORC Vectorized 5115 5154 32 3.1 325.2 1.4X
-Native ORC Vectorized (Pushdown) 5195 5217 13 3.0 330.3 1.3X
+Parquet Vectorized 7001 7010 11 2.2 445.1 1.0X
+Parquet Vectorized (Pushdown) 283 286 3 55.6 18.0 24.7X
+Native ORC Vectorized 5551 5686 146 2.8 352.9 1.3X
+Native ORC Vectorized (Pushdown) 5627 5640 16 2.8 357.7 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringStartsWith filter: (value like '786432%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6979 6997 12 2.3 443.7 1.0X
-Parquet Vectorized (Pushdown) 274 280 9 57.3 17.4 25.4X
-Native ORC Vectorized 5119 5136 15 3.1 325.5 1.4X
-Native ORC Vectorized (Pushdown) 5198 5208 12 3.0 330.5 1.3X
+Parquet Vectorized 6988 7047 59 2.3 444.3 1.0X
+Parquet Vectorized (Pushdown) 277 284 6 56.7 17.6 25.2X
+Native ORC Vectorized 5540 5572 25 2.8 352.2 1.3X
+Native ORC Vectorized (Pushdown) 5590 5668 138 2.8 355.4 1.2X
================================================================================================
Pushdown benchmark for StringEndsWith
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringEndsWith filter: (value like '%10'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5973 5987 14 2.6 379.7 1.0X
-Parquet Vectorized (Pushdown) 370 382 16 42.5 23.5 16.1X
-Native ORC Vectorized 6351 6383 32 2.5 403.8 0.9X
-Native ORC Vectorized (Pushdown) 6544 6582 25 2.4 416.0 0.9X
+Parquet Vectorized 5945 5962 14 2.6 378.0 1.0X
+Parquet Vectorized (Pushdown) 366 372 5 42.9 23.3 16.2X
+Native ORC Vectorized 6752 6760 8 2.3 429.3 0.9X
+Native ORC Vectorized (Pushdown) 6960 6970 10 2.3 442.5 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringEndsWith filter: (value like '%1000'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5923 5933 8 2.7 376.6 1.0X
-Parquet Vectorized (Pushdown) 275 283 9 57.2 17.5 21.5X
-Native ORC Vectorized 6303 6319 15 2.5 400.8 0.9X
-Native ORC Vectorized (Pushdown) 6516 6534 23 2.4 414.3 0.9X
+Parquet Vectorized 5870 5880 8 2.7 373.2 1.0X
+Parquet Vectorized (Pushdown) 270 274 3 58.2 17.2 21.7X
+Native ORC Vectorized 6702 6714 7 2.3 426.1 0.9X
+Native ORC Vectorized (Pushdown) 6889 6899 7 2.3 438.0 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringEndsWith filter: (value like '%786432'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5917 5931 12 2.7 376.2 1.0X
-Parquet Vectorized (Pushdown) 273 277 5 57.6 17.4 21.7X
-Native ORC Vectorized 6287 6313 29 2.5 399.7 0.9X
-Native ORC Vectorized (Pushdown) 6497 6528 39 2.4 413.1 0.9X
+Parquet Vectorized 5875 5884 9 2.7 373.5 1.0X
+Parquet Vectorized (Pushdown) 273 275 2 57.7 17.3 21.6X
+Native ORC Vectorized 6701 6719 15 2.3 426.0 0.9X
+Native ORC Vectorized (Pushdown) 6898 6907 14 2.3 438.5 0.9X
================================================================================================
Pushdown benchmark for StringContains
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringContains filter: (value like '%10%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6150 6166 17 2.6 391.0 1.0X
-Parquet Vectorized (Pushdown) 807 812 6 19.5 51.3 7.6X
-Native ORC Vectorized 6520 6534 11 2.4 414.5 0.9X
-Native ORC Vectorized (Pushdown) 6732 6769 43 2.3 428.0 0.9X
+Parquet Vectorized 6133 6149 15 2.6 390.0 1.0X
+Parquet Vectorized (Pushdown) 800 804 2 19.7 50.9 7.7X
+Native ORC Vectorized 6956 6979 21 2.3 442.3 0.9X
+Native ORC Vectorized (Pushdown) 7151 7176 30 2.2 454.6 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringContains filter: (value like '%1000%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5929 5947 22 2.7 376.9 1.0X
-Parquet Vectorized (Pushdown) 271 274 2 58.0 17.2 21.9X
-Native ORC Vectorized 6293 6322 18 2.5 400.1 0.9X
-Native ORC Vectorized (Pushdown) 6524 6551 23 2.4 414.8 0.9X
+Parquet Vectorized 5890 5907 30 2.7 374.5 1.0X
+Parquet Vectorized (Pushdown) 273 275 2 57.6 17.4 21.6X
+Native ORC Vectorized 6734 6755 18 2.3 428.2 0.9X
+Native ORC Vectorized (Pushdown) 6939 6969 40 2.3 441.2 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
StringContains filter: (value like '%786432%'): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5928 5940 12 2.7 376.9 1.0X
-Parquet Vectorized (Pushdown) 270 276 4 58.2 17.2 21.9X
-Native ORC Vectorized 6315 6331 14 2.5 401.5 0.9X
-Native ORC Vectorized (Pushdown) 6541 6560 24 2.4 415.9 0.9X
+Parquet Vectorized 5903 5912 7 2.7 375.3 1.0X
+Parquet Vectorized (Pushdown) 272 277 7 57.8 17.3 21.7X
+Native ORC Vectorized 6750 6754 5 2.3 429.2 0.9X
+Native ORC Vectorized (Pushdown) 6959 6964 3 2.3 442.4 0.8X
================================================================================================
Pushdown benchmark for decimal
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 decimal(9, 2) row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 2844 2858 11 5.5 180.8 1.0X
-Parquet Vectorized (Pushdown) 71 75 4 220.7 4.5 39.9X
-Native ORC Vectorized 3269 3284 13 4.8 207.8 0.9X
-Native ORC Vectorized (Pushdown) 57 62 5 277.1 3.6 50.1X
+Parquet Vectorized 2841 2858 10 5.5 180.6 1.0X
+Parquet Vectorized (Pushdown) 72 75 3 218.2 4.6 39.4X
+Native ORC Vectorized 3436 3446 11 4.6 218.5 0.8X
+Native ORC Vectorized (Pushdown) 60 63 5 261.1 3.8 47.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% decimal(9, 2) rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 4167 4190 17 3.8 264.9 1.0X
-Parquet Vectorized (Pushdown) 1956 1963 7 8.0 124.3 2.1X
-Native ORC Vectorized 4702 4733 34 3.3 298.9 0.9X
-Native ORC Vectorized (Pushdown) 2072 2081 8 7.6 131.8 2.0X
+Parquet Vectorized 4213 4222 9 3.7 267.9 1.0X
+Parquet Vectorized (Pushdown) 1983 1995 12 7.9 126.1 2.1X
+Native ORC Vectorized 4828 4877 49 3.3 307.0 0.9X
+Native ORC Vectorized (Pushdown) 2110 2113 2 7.5 134.2 2.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% decimal(9, 2) rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9042 9066 19 1.7 574.9 1.0X
-Parquet Vectorized (Pushdown) 8702 8717 13 1.8 553.2 1.0X
-Native ORC Vectorized 9335 9389 60 1.7 593.5 1.0X
-Native ORC Vectorized (Pushdown) 8897 8916 17 1.8 565.7 1.0X
+Parquet Vectorized 8728 8781 48 1.8 554.9 1.0X
+Parquet Vectorized (Pushdown) 8352 8367 10 1.9 531.0 1.0X
+Native ORC Vectorized 9324 9363 72 1.7 592.8 0.9X
+Native ORC Vectorized (Pushdown) 8880 8907 21 1.8 564.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% decimal(9, 2) rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 10057 10077 30 1.6 639.4 1.0X
-Parquet Vectorized (Pushdown) 10085 10114 25 1.6 641.2 1.0X
-Native ORC Vectorized 10713 10729 23 1.5 681.1 0.9X
-Native ORC Vectorized (Pushdown) 10724 10732 8 1.5 681.8 0.9X
+Parquet Vectorized 9920 9933 13 1.6 630.7 1.0X
+Parquet Vectorized (Pushdown) 9939 9967 37 1.6 631.9 1.0X
+Native ORC Vectorized 10375 10402 31 1.5 659.7 1.0X
+Native ORC Vectorized (Pushdown) 10399 10412 12 1.5 661.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 decimal(18, 2) row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3024 3051 16 5.2 192.3 1.0X
-Parquet Vectorized (Pushdown) 70 73 3 224.1 4.5 43.1X
-Native ORC Vectorized 3265 3286 21 4.8 207.6 0.9X
-Native ORC Vectorized (Pushdown) 55 59 3 288.1 3.5 55.4X
+Parquet Vectorized 3006 3036 18 5.2 191.1 1.0X
+Parquet Vectorized (Pushdown) 70 71 3 226.0 4.4 43.2X
+Native ORC Vectorized 3412 3426 18 4.6 216.9 0.9X
+Native ORC Vectorized (Pushdown) 57 61 4 273.9 3.7 52.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% decimal(18, 2) rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3784 3803 19 4.2 240.6 1.0X
-Parquet Vectorized (Pushdown) 1083 1086 2 14.5 68.9 3.5X
-Native ORC Vectorized 4014 4036 21 3.9 255.2 0.9X
-Native ORC Vectorized (Pushdown) 1060 1065 5 14.8 67.4 3.6X
+Parquet Vectorized 3776 3787 9 4.2 240.1 1.0X
+Parquet Vectorized (Pushdown) 1081 1089 5 14.5 68.7 3.5X
+Native ORC Vectorized 4137 4149 20 3.8 263.0 0.9X
+Native ORC Vectorized (Pushdown) 1103 1106 4 14.3 70.1 3.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% decimal(18, 2) rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6657 6670 11 2.4 423.2 1.0X
-Parquet Vectorized (Pushdown) 5177 5188 7 3.0 329.1 1.3X
-Native ORC Vectorized 6809 6821 11 2.3 432.9 1.0X
-Native ORC Vectorized (Pushdown) 5138 5159 21 3.1 326.6 1.3X
+Parquet Vectorized 6676 6690 11 2.4 424.5 1.0X
+Parquet Vectorized (Pushdown) 5195 5201 5 3.0 330.3 1.3X
+Native ORC Vectorized 6988 6997 8 2.3 444.3 1.0X
+Native ORC Vectorized (Pushdown) 5310 5313 3 3.0 337.6 1.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% decimal(18, 2) rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9548 9572 19 1.6 607.0 1.0X
-Parquet Vectorized (Pushdown) 9291 9322 27 1.7 590.7 1.0X
-Native ORC Vectorized 9610 9623 13 1.6 611.0 1.0X
-Native ORC Vectorized (Pushdown) 9260 9297 30 1.7 588.7 1.0X
+Parquet Vectorized 9514 9520 9 1.7 604.9 1.0X
+Parquet Vectorized (Pushdown) 9238 9281 48 1.7 587.3 1.0X
+Native ORC Vectorized 9832 9868 23 1.6 625.1 1.0X
+Native ORC Vectorized (Pushdown) 9492 9499 5 1.7 603.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 decimal(38, 2) row (value = 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 4320 4337 10 3.6 274.7 1.0X
-Parquet Vectorized (Pushdown) 78 82 5 201.0 5.0 55.2X
-Native ORC Vectorized 3340 3363 21 4.7 212.4 1.3X
-Native ORC Vectorized (Pushdown) 55 57 2 285.9 3.5 78.5X
+Parquet Vectorized 4281 4291 8 3.7 272.2 1.0X
+Parquet Vectorized (Pushdown) 76 79 3 206.4 4.8 56.2X
+Native ORC Vectorized 3458 3474 17 4.5 219.8 1.2X
+Native ORC Vectorized (Pushdown) 58 60 3 273.4 3.7 74.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% decimal(38, 2) rows (value < 1572864): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 5208 5229 32 3.0 331.1 1.0X
-Parquet Vectorized (Pushdown) 1386 1393 9 11.3 88.1 3.8X
-Native ORC Vectorized 4160 4198 56 3.8 264.5 1.3X
-Native ORC Vectorized (Pushdown) 1187 1194 9 13.3 75.5 4.4X
+Parquet Vectorized 5238 5246 8 3.0 333.0 1.0X
+Parquet Vectorized (Pushdown) 1422 1424 1 11.1 90.4 3.7X
+Native ORC Vectorized 4308 4321 15 3.7 273.9 1.2X
+Native ORC Vectorized (Pushdown) 1227 1230 3 12.8 78.0 4.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% decimal(38, 2) rows (value < 7864320): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 8789 8818 34 1.8 558.8 1.0X
-Parquet Vectorized (Pushdown) 6686 6697 13 2.4 425.1 1.3X
-Native ORC Vectorized 7476 7500 26 2.1 475.3 1.2X
-Native ORC Vectorized (Pushdown) 5812 5837 37 2.7 369.5 1.5X
+Parquet Vectorized 8951 8969 18 1.8 569.1 1.0X
+Parquet Vectorized (Pushdown) 6863 6900 29 2.3 436.4 1.3X
+Native ORC Vectorized 7606 7620 10 2.1 483.6 1.2X
+Native ORC Vectorized (Pushdown) 5900 5906 7 2.7 375.1 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% decimal(38, 2) rows (value < 14155776): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 12304 12358 67 1.3 782.2 1.0X
-Parquet Vectorized (Pushdown) 11966 12032 48 1.3 760.8 1.0X
-Native ORC Vectorized 10772 10813 30 1.5 684.9 1.1X
-Native ORC Vectorized (Pushdown) 10441 10482 35 1.5 663.8 1.2X
+Parquet Vectorized 12623 12678 67 1.2 802.5 1.0X
+Parquet Vectorized (Pushdown) 12207 12224 16 1.3 776.1 1.0X
+Native ORC Vectorized 10898 10906 5 1.4 692.9 1.2X
+Native ORC Vectorized (Pushdown) 10575 10588 11 1.5 672.3 1.2X
================================================================================================
Pushdown benchmark for InSet -> InFilters
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 5, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6578 6604 16 2.4 418.2 1.0X
-Parquet Vectorized (Pushdown) 294 298 4 53.5 18.7 22.4X
-Native ORC Vectorized 4871 4897 29 3.2 309.7 1.4X
-Native ORC Vectorized (Pushdown) 286 292 4 54.9 18.2 23.0X
+Parquet Vectorized 6516 6546 29 2.4 414.3 1.0X
+Parquet Vectorized (Pushdown) 289 292 4 54.5 18.4 22.6X
+Native ORC Vectorized 4902 4907 4 3.2 311.7 1.3X
+Native ORC Vectorized (Pushdown) 296 304 10 53.2 18.8 22.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 5, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6590 6598 7 2.4 419.0 1.0X
-Parquet Vectorized (Pushdown) 294 303 9 53.5 18.7 22.4X
-Native ORC Vectorized 4778 4800 25 3.3 303.8 1.4X
-Native ORC Vectorized (Pushdown) 283 286 2 55.6 18.0 23.3X
+Parquet Vectorized 6532 6549 13 2.4 415.3 1.0X
+Parquet Vectorized (Pushdown) 285 287 2 55.2 18.1 22.9X
+Native ORC Vectorized 4884 4887 3 3.2 310.5 1.3X
+Native ORC Vectorized (Pushdown) 292 300 8 53.8 18.6 22.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 5, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6532 6560 29 2.4 415.3 1.0X
-Parquet Vectorized (Pushdown) 289 294 5 54.5 18.4 22.6X
-Native ORC Vectorized 4769 4784 11 3.3 303.2 1.4X
-Native ORC Vectorized (Pushdown) 283 285 2 55.6 18.0 23.1X
+Parquet Vectorized 6524 6531 7 2.4 414.8 1.0X
+Parquet Vectorized (Pushdown) 287 291 5 54.8 18.2 22.7X
+Native ORC Vectorized 4897 4912 16 3.2 311.3 1.3X
+Native ORC Vectorized (Pushdown) 294 300 7 53.5 18.7 22.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 10, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6565 6610 62 2.4 417.4 1.0X
-Parquet Vectorized (Pushdown) 302 313 11 52.1 19.2 21.8X
-Native ORC Vectorized 4787 4816 57 3.3 304.3 1.4X
-Native ORC Vectorized (Pushdown) 296 298 3 53.2 18.8 22.2X
+Parquet Vectorized 6534 6553 12 2.4 415.4 1.0X
+Parquet Vectorized (Pushdown) 302 306 3 52.1 19.2 21.6X
+Native ORC Vectorized 4889 4900 13 3.2 310.9 1.3X
+Native ORC Vectorized (Pushdown) 310 314 6 50.8 19.7 21.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 10, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6569 6591 15 2.4 417.6 1.0X
-Parquet Vectorized (Pushdown) 303 307 3 51.8 19.3 21.6X
-Native ORC Vectorized 4772 4801 25 3.3 303.4 1.4X
-Native ORC Vectorized (Pushdown) 297 304 11 53.0 18.9 22.1X
+Parquet Vectorized 6521 6537 15 2.4 414.6 1.0X
+Parquet Vectorized (Pushdown) 303 306 2 51.9 19.3 21.5X
+Native ORC Vectorized 4892 4897 4 3.2 311.0 1.3X
+Native ORC Vectorized (Pushdown) 310 319 13 50.8 19.7 21.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 10, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6552 6564 17 2.4 416.5 1.0X
-Parquet Vectorized (Pushdown) 307 314 11 51.3 19.5 21.4X
-Native ORC Vectorized 4782 4799 11 3.3 304.0 1.4X
-Native ORC Vectorized (Pushdown) 300 305 5 52.4 19.1 21.8X
+Parquet Vectorized 6517 6526 10 2.4 414.4 1.0X
+Parquet Vectorized (Pushdown) 304 309 4 51.8 19.3 21.5X
+Native ORC Vectorized 4891 4898 9 3.2 310.9 1.3X
+Native ORC Vectorized (Pushdown) 310 315 5 50.8 19.7 21.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 50, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6741 6765 20 2.3 428.6 1.0X
-Parquet Vectorized (Pushdown) 895 899 5 17.6 56.9 7.5X
-Native ORC Vectorized 4998 5024 19 3.1 317.8 1.3X
-Native ORC Vectorized (Pushdown) 397 401 3 39.6 25.3 17.0X
+Parquet Vectorized 6739 6750 7 2.3 428.5 1.0X
+Parquet Vectorized (Pushdown) 886 889 2 17.8 56.3 7.6X
+Native ORC Vectorized 5109 5115 3 3.1 324.8 1.3X
+Native ORC Vectorized (Pushdown) 417 425 9 37.7 26.5 16.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 50, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6749 6756 9 2.3 429.1 1.0X
-Parquet Vectorized (Pushdown) 3368 3387 24 4.7 214.1 2.0X
-Native ORC Vectorized 4978 5002 16 3.2 316.5 1.4X
-Native ORC Vectorized (Pushdown) 426 430 5 36.9 27.1 15.8X
+Parquet Vectorized 6742 6750 7 2.3 428.6 1.0X
+Parquet Vectorized (Pushdown) 3390 3412 37 4.6 215.5 2.0X
+Native ORC Vectorized 5124 5127 5 3.1 325.8 1.3X
+Native ORC Vectorized (Pushdown) 443 448 3 35.5 28.2 15.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 50, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6724 6744 13 2.3 427.5 1.0X
-Parquet Vectorized (Pushdown) 6089 6117 29 2.6 387.1 1.1X
-Native ORC Vectorized 4978 4995 14 3.2 316.5 1.4X
-Native ORC Vectorized (Pushdown) 423 424 1 37.2 26.9 15.9X
+Parquet Vectorized 6737 6741 3 2.3 428.3 1.0X
+Parquet Vectorized (Pushdown) 6038 6051 12 2.6 383.9 1.1X
+Native ORC Vectorized 5095 5110 15 3.1 323.9 1.3X
+Native ORC Vectorized (Pushdown) 444 448 5 35.5 28.2 15.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 100, distribution: 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6727 6765 45 2.3 427.7 1.0X
-Parquet Vectorized (Pushdown) 923 928 7 17.0 58.7 7.3X
-Native ORC Vectorized 4938 4959 18 3.2 313.9 1.4X
-Native ORC Vectorized (Pushdown) 500 509 7 31.5 31.8 13.5X
+Parquet Vectorized 6679 6694 13 2.4 424.7 1.0X
+Parquet Vectorized (Pushdown) 894 898 3 17.6 56.9 7.5X
+Native ORC Vectorized 5069 5087 30 3.1 322.3 1.3X
+Native ORC Vectorized (Pushdown) 514 521 6 30.6 32.7 13.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 100, distribution: 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6705 6743 54 2.3 426.3 1.0X
-Parquet Vectorized (Pushdown) 3479 3492 19 4.5 221.2 1.9X
-Native ORC Vectorized 4952 4959 8 3.2 314.9 1.4X
-Native ORC Vectorized (Pushdown) 581 587 6 27.1 36.9 11.5X
+Parquet Vectorized 6685 6698 9 2.4 425.1 1.0X
+Parquet Vectorized (Pushdown) 3472 3482 8 4.5 220.7 1.9X
+Native ORC Vectorized 5078 5084 4 3.1 322.8 1.3X
+Native ORC Vectorized (Pushdown) 589 593 4 26.7 37.4 11.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
InSet -> InFilters (values count: 100, distribution: 90): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6696 6718 21 2.3 425.7 1.0X
-Parquet Vectorized (Pushdown) 6017 6033 17 2.6 382.6 1.1X
-Native ORC Vectorized 4926 4943 11 3.2 313.2 1.4X
-Native ORC Vectorized (Pushdown) 583 590 5 27.0 37.1 11.5X
+Parquet Vectorized 6685 6710 28 2.4 425.1 1.0X
+Parquet Vectorized (Pushdown) 6014 6035 30 2.6 382.4 1.1X
+Native ORC Vectorized 5078 5086 8 3.1 322.8 1.3X
+Native ORC Vectorized (Pushdown) 607 612 7 25.9 38.6 11.0X
================================================================================================
Pushdown benchmark for tinyint
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 tinyint row (value = CAST(63 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3127 3134 6 5.0 198.8 1.0X
-Parquet Vectorized (Pushdown) 109 114 6 144.1 6.9 28.6X
-Native ORC Vectorized 2198 2204 4 7.2 139.8 1.4X
-Native ORC Vectorized (Pushdown) 114 117 3 137.4 7.3 27.3X
+Parquet Vectorized 3186 3197 20 4.9 202.6 1.0X
+Parquet Vectorized (Pushdown) 110 113 3 142.6 7.0 28.9X
+Native ORC Vectorized 2375 2386 9 6.6 151.0 1.3X
+Native ORC Vectorized (Pushdown) 119 122 3 131.8 7.6 26.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% tinyint rows (value < CAST(12 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3775 3787 16 4.2 240.0 1.0X
-Parquet Vectorized (Pushdown) 1009 1011 2 15.6 64.2 3.7X
-Native ORC Vectorized 2801 2805 3 5.6 178.1 1.3X
-Native ORC Vectorized (Pushdown) 900 908 12 17.5 57.3 4.2X
+Parquet Vectorized 3763 3770 8 4.2 239.3 1.0X
+Parquet Vectorized (Pushdown) 1006 1011 5 15.6 64.0 3.7X
+Native ORC Vectorized 2942 2982 46 5.3 187.1 1.3X
+Native ORC Vectorized (Pushdown) 874 877 3 18.0 55.6 4.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% tinyint rows (value < CAST(63 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6493 6501 6 2.4 412.8 1.0X
-Parquet Vectorized (Pushdown) 4968 4989 30 3.2 315.8 1.3X
-Native ORC Vectorized 5371 5406 36 2.9 341.5 1.2X
-Native ORC Vectorized (Pushdown) 4292 4310 16 3.7 272.9 1.5X
+Parquet Vectorized 6306 6312 7 2.5 400.9 1.0X
+Parquet Vectorized (Pushdown) 4795 4802 6 3.3 304.8 1.3X
+Native ORC Vectorized 5414 5423 6 2.9 344.2 1.2X
+Native ORC Vectorized (Pushdown) 4282 4284 3 3.7 272.2 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% tinyint rows (value < CAST(114 AS tinyint)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9195 9235 69 1.7 584.6 1.0X
-Parquet Vectorized (Pushdown) 8940 8970 48 1.8 568.4 1.0X
-Native ORC Vectorized 7767 7796 46 2.0 493.8 1.2X
-Native ORC Vectorized (Pushdown) 7592 7621 27 2.1 482.7 1.2X
+Parquet Vectorized 9069 9075 5 1.7 576.6 1.0X
+Parquet Vectorized (Pushdown) 8806 8818 9 1.8 559.9 1.0X
+Native ORC Vectorized 7795 7800 5 2.0 495.6 1.2X
+Native ORC Vectorized (Pushdown) 7586 7605 16 2.1 482.3 1.2X
================================================================================================
Pushdown benchmark for Timestamp
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 timestamp stored as INT96 row (value = timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3252 3261 7 4.8 206.8 1.0X
-Parquet Vectorized (Pushdown) 3242 3262 24 4.9 206.1 1.0X
-Native ORC Vectorized 2097 2110 11 7.5 133.3 1.6X
-Native ORC Vectorized (Pushdown) 39 43 4 401.0 2.5 82.9X
+Parquet Vectorized 3221 3224 3 4.9 204.8 1.0X
+Parquet Vectorized (Pushdown) 3228 3235 8 4.9 205.3 1.0X
+Native ORC Vectorized 2229 2241 15 7.1 141.7 1.4X
+Native ORC Vectorized (Pushdown) 43 45 3 369.5 2.7 75.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% timestamp stored as INT96 rows (value < timestamp_seconds(1572864)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3941 3946 5 4.0 250.6 1.0X
-Parquet Vectorized (Pushdown) 3930 3942 16 4.0 249.8 1.0X
-Native ORC Vectorized 2713 2722 16 5.8 172.5 1.5X
-Native ORC Vectorized (Pushdown) 852 858 9 18.5 54.2 4.6X
+Parquet Vectorized 3932 3953 18 4.0 250.0 1.0X
+Parquet Vectorized (Pushdown) 3926 3932 4 4.0 249.6 1.0X
+Native ORC Vectorized 2893 2902 13 5.4 183.9 1.4X
+Native ORC Vectorized (Pushdown) 914 922 8 17.2 58.1 4.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% timestamp stored as INT96 rows (value < timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6700 6735 46 2.3 426.0 1.0X
-Parquet Vectorized (Pushdown) 6701 6727 19 2.3 426.0 1.0X
-Native ORC Vectorized 5113 5127 18 3.1 325.1 1.3X
-Native ORC Vectorized (Pushdown) 4045 4067 31 3.9 257.2 1.7X
+Parquet Vectorized 6853 6857 3 2.3 435.7 1.0X
+Parquet Vectorized (Pushdown) 6848 6857 14 2.3 435.4 1.0X
+Native ORC Vectorized 5512 5540 37 2.9 350.4 1.2X
+Native ORC Vectorized (Pushdown) 4361 4386 27 3.6 277.3 1.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% timestamp stored as INT96 rows (value < timestamp_seconds(14155776)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9366 9381 19 1.7 595.5 1.0X
-Parquet Vectorized (Pushdown) 9369 9383 22 1.7 595.7 1.0X
-Native ORC Vectorized 7608 7687 83 2.1 483.7 1.2X
-Native ORC Vectorized (Pushdown) 7411 7431 19 2.1 471.2 1.3X
+Parquet Vectorized 9465 9534 92 1.7 601.7 1.0X
+Parquet Vectorized (Pushdown) 9532 9575 45 1.7 606.1 1.0X
+Native ORC Vectorized 8097 8146 39 1.9 514.8 1.2X
+Native ORC Vectorized (Pushdown) 8029 8064 27 2.0 510.5 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 timestamp stored as TIMESTAMP_MICROS row (value = timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3004 3041 38 5.2 191.0 1.0X
-Parquet Vectorized (Pushdown) 69 72 4 229.2 4.4 43.8X
-Native ORC Vectorized 2095 2101 5 7.5 133.2 1.4X
-Native ORC Vectorized (Pushdown) 38 41 3 409.1 2.4 78.1X
+Parquet Vectorized 2994 3008 15 5.3 190.3 1.0X
+Parquet Vectorized (Pushdown) 70 75 3 223.8 4.5 42.6X
+Native ORC Vectorized 2247 2257 12 7.0 142.8 1.3X
+Native ORC Vectorized (Pushdown) 44 51 5 354.7 2.8 67.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% timestamp stored as TIMESTAMP_MICROS rows (value < timestamp_seconds(1572864)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3705 3715 10 4.2 235.6 1.0X
-Parquet Vectorized (Pushdown) 1050 1052 2 15.0 66.7 3.5X
-Native ORC Vectorized 2714 2726 9 5.8 172.6 1.4X
-Native ORC Vectorized (Pushdown) 851 854 6 18.5 54.1 4.4X
+Parquet Vectorized 3719 3796 54 4.2 236.4 1.0X
+Parquet Vectorized (Pushdown) 1074 1091 12 14.6 68.3 3.5X
+Native ORC Vectorized 2922 2951 17 5.4 185.8 1.3X
+Native ORC Vectorized (Pushdown) 926 944 13 17.0 58.9 4.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% timestamp stored as TIMESTAMP_MICROS rows (value < timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6438 6454 13 2.4 409.3 1.0X
-Parquet Vectorized (Pushdown) 4976 4983 5 3.2 316.4 1.3X
-Native ORC Vectorized 5124 5140 16 3.1 325.8 1.3X
-Native ORC Vectorized (Pushdown) 4055 4089 30 3.9 257.8 1.6X
+Parquet Vectorized 6719 6753 25 2.3 427.2 1.0X
+Parquet Vectorized (Pushdown) 5237 5278 27 3.0 333.0 1.3X
+Native ORC Vectorized 5596 5604 10 2.8 355.8 1.2X
+Native ORC Vectorized (Pushdown) 4331 4388 47 3.6 275.3 1.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% timestamp stored as TIMESTAMP_MICROS rows (value < timestamp_seconds(14155776)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9096 9115 18 1.7 578.3 1.0X
-Parquet Vectorized (Pushdown) 8823 8839 11 1.8 561.0 1.0X
-Native ORC Vectorized 7554 7578 23 2.1 480.2 1.2X
-Native ORC Vectorized (Pushdown) 7372 7392 16 2.1 468.7 1.2X
+Parquet Vectorized 9216 9232 14 1.7 585.9 1.0X
+Parquet Vectorized (Pushdown) 8949 8960 11 1.8 569.0 1.0X
+Native ORC Vectorized 8266 8296 51 1.9 525.5 1.1X
+Native ORC Vectorized (Pushdown) 8030 8045 16 2.0 510.6 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 timestamp stored as TIMESTAMP_MILLIS row (value = timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3027 3036 7 5.2 192.5 1.0X
-Parquet Vectorized (Pushdown) 69 71 3 228.9 4.4 44.1X
-Native ORC Vectorized 2093 2100 11 7.5 133.1 1.4X
-Native ORC Vectorized (Pushdown) 38 41 3 411.8 2.4 79.2X
+Parquet Vectorized 3022 3027 5 5.2 192.1 1.0X
+Parquet Vectorized (Pushdown) 69 70 2 228.7 4.4 43.9X
+Native ORC Vectorized 2225 2230 3 7.1 141.5 1.4X
+Native ORC Vectorized (Pushdown) 42 44 3 377.3 2.7 72.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 10% timestamp stored as TIMESTAMP_MILLIS rows (value < timestamp_seconds(1572864)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 3718 3735 21 4.2 236.4 1.0X
-Parquet Vectorized (Pushdown) 1043 1049 7 15.1 66.3 3.6X
-Native ORC Vectorized 2707 2719 17 5.8 172.1 1.4X
-Native ORC Vectorized (Pushdown) 848 852 3 18.6 53.9 4.4X
+Parquet Vectorized 3711 3727 14 4.2 236.0 1.0X
+Parquet Vectorized (Pushdown) 1053 1056 3 14.9 66.9 3.5X
+Native ORC Vectorized 2889 2917 54 5.4 183.7 1.3X
+Native ORC Vectorized (Pushdown) 912 915 2 17.3 58.0 4.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 50% timestamp stored as TIMESTAMP_MILLIS rows (value < timestamp_seconds(7864320)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 6450 6462 13 2.4 410.1 1.0X
-Parquet Vectorized (Pushdown) 4988 4998 8 3.2 317.1 1.3X
-Native ORC Vectorized 5126 5140 15 3.1 325.9 1.3X
-Native ORC Vectorized (Pushdown) 4049 4060 8 3.9 257.4 1.6X
+Parquet Vectorized 6607 6613 10 2.4 420.1 1.0X
+Parquet Vectorized (Pushdown) 5149 5167 33 3.1 327.3 1.3X
+Native ORC Vectorized 5498 5511 9 2.9 349.6 1.2X
+Native ORC Vectorized (Pushdown) 4356 4368 10 3.6 276.9 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 90% timestamp stored as TIMESTAMP_MILLIS rows (value < timestamp_seconds(14155776)): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 9130 9146 18 1.7 580.4 1.0X
-Parquet Vectorized (Pushdown) 8854 8885 20 1.8 562.9 1.0X
-Native ORC Vectorized 7538 7557 20 2.1 479.3 1.2X
-Native ORC Vectorized (Pushdown) 7310 7361 38 2.2 464.8 1.2X
+Parquet Vectorized 9222 9225 2 1.7 586.3 1.0X
+Parquet Vectorized (Pushdown) 8952 8972 19 1.8 569.2 1.0X
+Native ORC Vectorized 8251 8266 16 1.9 524.6 1.1X
+Native ORC Vectorized (Pushdown) 8030 8044 16 2.0 510.5 1.1X
================================================================================================
Pushdown benchmark with many filters
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 row with 1 filters: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 48 49 2 0.0 47572233.0 1.0X
-Parquet Vectorized (Pushdown) 48 51 3 0.0 47933317.0 1.0X
-Native ORC Vectorized 41 43 2 0.0 41232680.0 1.2X
-Native ORC Vectorized (Pushdown) 44 50 8 0.0 43791797.0 1.1X
+Parquet Vectorized 47 49 5 0.0 46814687.0 1.0X
+Parquet Vectorized (Pushdown) 48 50 4 0.0 48049852.0 1.0X
+Native ORC Vectorized 42 44 4 0.0 41770894.0 1.1X
+Native ORC Vectorized (Pushdown) 45 47 4 0.0 44627062.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 row with 250 filters: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 172 179 5 0.0 171668021.0 1.0X
-Parquet Vectorized (Pushdown) 175 183 8 0.0 174931280.0 1.0X
-Native ORC Vectorized 165 173 8 0.0 164882447.0 1.0X
-Native ORC Vectorized (Pushdown) 169 174 6 0.0 168734657.0 1.0X
+Parquet Vectorized 174 179 5 0.0 173730940.0 1.0X
+Parquet Vectorized (Pushdown) 177 183 6 0.0 177380451.0 1.0X
+Native ORC Vectorized 168 174 4 0.0 168397398.0 1.0X
+Native ORC Vectorized (Pushdown) 174 178 6 0.0 173527951.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select 1 row with 500 filters: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Parquet Vectorized 523 547 25 0.0 523403894.0 1.0X
-Parquet Vectorized (Pushdown) 546 559 13 0.0 545572756.0 1.0X
-Native ORC Vectorized 525 544 15 0.0 525242709.0 1.0X
-Native ORC Vectorized (Pushdown) 532 554 28 0.0 531883827.0 1.0X
+Parquet Vectorized 545 556 11 0.0 544697398.0 1.0X
+Parquet Vectorized (Pushdown) 564 568 3 0.0 564247787.0 1.0X
+Native ORC Vectorized 536 549 11 0.0 536299871.0 1.0X
+Native ORC Vectorized (Pushdown) 545 548 3 0.0 544510520.0 1.0X
diff --git a/sql/core/benchmarks/GenerateExecBenchmark-jdk21-results.txt b/sql/core/benchmarks/GenerateExecBenchmark-jdk21-results.txt
index dc19c4fac6858..68ee1e97ee016 100644
--- a/sql/core/benchmarks/GenerateExecBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/GenerateExecBenchmark-jdk21-results.txt
@@ -2,11 +2,11 @@
GenerateExec benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
GenerateExec Benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-GenerateExec Benchmark wholestage off 70672 71244 809 1.4 706.7 1.0X
-GenerateExec Benchmark wholestage on 21022 21399 226 4.8 210.2 3.4X
+GenerateExec Benchmark wholestage off 72498 73647 1625 1.4 725.0 1.0X
+GenerateExec Benchmark wholestage on 23805 23956 189 4.2 238.1 3.0X
diff --git a/sql/core/benchmarks/GenerateExecBenchmark-results.txt b/sql/core/benchmarks/GenerateExecBenchmark-results.txt
index ab7a58d4f8a6d..bbdacf15ef8f0 100644
--- a/sql/core/benchmarks/GenerateExecBenchmark-results.txt
+++ b/sql/core/benchmarks/GenerateExecBenchmark-results.txt
@@ -2,11 +2,11 @@
GenerateExec benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
GenerateExec Benchmark: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-GenerateExec Benchmark wholestage off 69333 69516 259 1.4 693.3 1.0X
-GenerateExec Benchmark wholestage on 23359 23683 302 4.3 233.6 3.0X
+GenerateExec Benchmark wholestage off 70300 70379 111 1.4 703.0 1.0X
+GenerateExec Benchmark wholestage on 25435 25593 321 3.9 254.3 2.8X
diff --git a/sql/core/benchmarks/HashedRelationMetricsBenchmark-jdk21-results.txt b/sql/core/benchmarks/HashedRelationMetricsBenchmark-jdk21-results.txt
index edb74e92c5ee0..7449722cdcbef 100644
--- a/sql/core/benchmarks/HashedRelationMetricsBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/HashedRelationMetricsBenchmark-jdk21-results.txt
@@ -2,10 +2,10 @@
LongToUnsafeRowMap metrics
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LongToUnsafeRowMap metrics: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-LongToUnsafeRowMap 265 268 3 1.9 529.3 1.0X
+LongToUnsafeRowMap 267 271 4 1.9 534.8 1.0X
diff --git a/sql/core/benchmarks/HashedRelationMetricsBenchmark-results.txt b/sql/core/benchmarks/HashedRelationMetricsBenchmark-results.txt
index e8fcbffee58b8..55452a515f1f2 100644
--- a/sql/core/benchmarks/HashedRelationMetricsBenchmark-results.txt
+++ b/sql/core/benchmarks/HashedRelationMetricsBenchmark-results.txt
@@ -2,10 +2,10 @@
LongToUnsafeRowMap metrics
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
LongToUnsafeRowMap metrics: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-LongToUnsafeRowMap 249 252 2 2.0 498.8 1.0X
+LongToUnsafeRowMap 258 263 6 1.9 515.9 1.0X
diff --git a/sql/core/benchmarks/InExpressionBenchmark-jdk21-results.txt b/sql/core/benchmarks/InExpressionBenchmark-jdk21-results.txt
index 3a7e026c04398..e6f609f1c52f0 100644
--- a/sql/core/benchmarks/InExpressionBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/InExpressionBenchmark-jdk21-results.txt
@@ -2,739 +2,739 @@
In Expression Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 37 50 9 273.5 3.7 1.0X
-InSet expression 65 75 8 153.6 6.5 0.6X
+In expression 40 53 8 252.1 4.0 1.0X
+InSet expression 67 81 10 148.2 6.7 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 34 40 6 290.9 3.4 1.0X
-InSet expression 59 64 4 168.1 5.9 0.6X
+In expression 37 42 7 270.7 3.7 1.0X
+InSet expression 63 65 2 159.3 6.3 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 63 67 6 158.6 6.3 1.0X
-InSet expression 76 78 2 131.4 7.6 0.8X
+In expression 63 68 7 158.2 6.3 1.0X
+InSet expression 77 81 4 129.2 7.7 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 104 106 2 96.2 10.4 1.0X
-InSet expression 83 86 3 120.8 8.3 1.3X
+In expression 107 110 3 93.4 10.7 1.0X
+InSet expression 84 88 4 119.3 8.4 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 183 185 3 54.7 18.3 1.0X
-InSet expression 96 100 2 104.1 9.6 1.9X
+In expression 185 187 2 54.0 18.5 1.0X
+InSet expression 97 101 3 102.7 9.7 1.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 396 402 7 25.2 39.6 1.0X
-InSet expression 192 194 2 52.1 19.2 2.1X
+In expression 396 402 8 25.2 39.6 1.0X
+InSet expression 191 194 3 52.3 19.1 2.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 29 34 5 340.7 2.9 1.0X
-InSet expression 80 82 2 125.3 8.0 0.4X
+In expression 30 34 5 329.7 3.0 1.0X
+InSet expression 76 80 2 131.0 7.6 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 38 44 9 260.8 3.8 1.0X
-InSet expression 95 97 2 105.8 9.5 0.4X
+In expression 40 44 4 248.7 4.0 1.0X
+InSet expression 93 96 8 107.9 9.3 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 69 71 2 143.9 6.9 1.0X
-InSet expression 94 98 2 105.9 9.4 0.7X
+In expression 71 72 2 140.3 7.1 1.0X
+InSet expression 91 93 1 109.7 9.1 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 117 118 1 85.6 11.7 1.0X
-InSet expression 131 135 3 76.5 13.1 0.9X
+In expression 119 121 3 84.1 11.9 1.0X
+InSet expression 130 132 3 77.2 13.0 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 195 197 2 51.3 19.5 1.0X
-InSet expression 119 122 2 84.0 11.9 1.6X
+In expression 197 202 10 50.7 19.7 1.0X
+InSet expression 115 118 2 86.8 11.5 1.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 370 371 1 27.1 37.0 1.0X
-InSet expression 129 131 1 77.5 12.9 2.9X
+In expression 369 371 4 27.1 36.9 1.0X
+InSet expression 123 126 2 81.6 12.3 3.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 553 558 4 18.1 55.3 1.0X
-InSet expression 142 144 2 70.4 14.2 3.9X
+In expression 550 551 1 18.2 55.0 1.0X
+InSet expression 136 139 2 73.7 13.6 4.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 733 737 3 13.6 73.3 1.0X
-InSet expression 154 157 3 64.9 15.4 4.8X
+In expression 735 736 1 13.6 73.5 1.0X
+InSet expression 150 152 1 66.6 15.0 4.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 938 945 5 10.7 93.8 1.0X
-InSet expression 168 171 2 59.4 16.8 5.6X
+In expression 988 992 3 10.1 98.8 1.0X
+InSet expression 162 165 1 61.6 16.2 6.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 26 28 3 389.4 2.6 1.0X
-InSet expression 77 80 3 129.7 7.7 0.3X
+In expression 27 30 4 367.2 2.7 1.0X
+InSet expression 73 76 2 136.3 7.3 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 34 37 4 295.5 3.4 1.0X
-InSet expression 94 96 1 106.4 9.4 0.4X
+In expression 35 39 5 283.8 3.5 1.0X
+InSet expression 92 95 2 108.3 9.2 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 59 61 3 169.7 5.9 1.0X
-InSet expression 122 126 7 82.1 12.2 0.5X
+In expression 61 63 3 165.0 6.1 1.0X
+InSet expression 121 124 2 82.4 12.1 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 110 112 4 91.0 11.0 1.0X
-InSet expression 138 141 2 72.5 13.8 0.8X
+In expression 112 113 2 89.4 11.2 1.0X
+InSet expression 135 139 4 73.9 13.5 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 192 196 4 52.0 19.2 1.0X
-InSet expression 122 125 2 81.9 12.2 1.6X
+In expression 194 195 2 51.4 19.4 1.0X
+InSet expression 117 121 2 85.2 11.7 1.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 342 344 3 29.3 34.2 1.0X
-InSet expression 129 132 3 77.5 12.9 2.6X
+In expression 343 344 1 29.1 34.3 1.0X
+InSet expression 123 126 2 81.2 12.3 2.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 513 521 7 19.5 51.3 1.0X
-InSet expression 139 142 2 72.2 13.9 3.7X
+In expression 514 515 1 19.5 51.4 1.0X
+InSet expression 134 136 1 74.7 13.4 3.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 660 661 1 15.1 66.0 1.0X
-InSet expression 153 156 1 65.4 15.3 4.3X
+In expression 662 665 4 15.1 66.2 1.0X
+InSet expression 147 151 3 68.1 14.7 4.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 858 865 6 11.7 85.8 1.0X
-InSet expression 164 173 21 61.1 16.4 5.2X
+In expression 847 853 4 11.8 84.7 1.0X
+InSet expression 160 162 2 62.7 16.0 5.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 25 27 4 398.8 2.5 1.0X
-InSet expression 86 87 1 116.6 8.6 0.3X
+In expression 26 28 3 385.2 2.6 1.0X
+InSet expression 81 83 1 123.4 8.1 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 36 40 5 277.9 3.6 1.0X
-InSet expression 106 109 3 94.4 10.6 0.3X
+In expression 38 40 3 266.2 3.8 1.0X
+InSet expression 98 100 1 102.4 9.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 58 60 3 172.3 5.8 1.0X
-InSet expression 107 108 1 93.9 10.7 0.5X
+In expression 60 62 3 167.1 6.0 1.0X
+InSet expression 98 100 2 102.2 9.8 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 115 116 2 87.1 11.5 1.0X
-InSet expression 151 154 1 66.0 15.1 0.8X
+In expression 117 118 1 85.5 11.7 1.0X
+InSet expression 135 138 2 73.9 13.5 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 192 198 5 52.2 19.2 1.0X
-InSet expression 129 131 3 77.7 12.9 1.5X
+In expression 184 193 4 54.4 18.4 1.0X
+InSet expression 118 121 2 84.4 11.8 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 353 357 5 28.3 35.3 1.0X
-InSet expression 134 136 1 74.5 13.4 2.6X
+In expression 354 355 1 28.3 35.4 1.0X
+InSet expression 124 125 1 80.7 12.4 2.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 508 527 21 19.7 50.8 1.0X
-InSet expression 146 148 2 68.3 14.6 3.5X
+In expression 513 513 1 19.5 51.3 1.0X
+InSet expression 136 138 1 73.6 13.6 3.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 668 685 15 15.0 66.8 1.0X
-InSet expression 159 162 2 62.8 15.9 4.2X
+In expression 678 680 4 14.8 67.8 1.0X
+InSet expression 148 152 3 67.5 14.8 4.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 833 860 47 12.0 83.3 1.0X
-InSet expression 173 176 2 57.8 17.3 4.8X
+In expression 829 834 6 12.1 82.9 1.0X
+InSet expression 160 163 1 62.3 16.0 5.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 20 23 5 509.7 2.0 1.0X
-InSet expression 82 84 2 122.5 8.2 0.2X
+In expression 20 24 4 495.0 2.0 1.0X
+InSet expression 78 80 1 127.9 7.8 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 27 29 3 364.7 2.7 1.0X
-InSet expression 102 104 1 97.7 10.2 0.3X
+In expression 29 31 3 349.1 2.9 1.0X
+InSet expression 95 97 1 105.3 9.5 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 56 58 3 178.9 5.6 1.0X
-InSet expression 118 120 1 84.4 11.8 0.5X
+In expression 58 60 2 173.7 5.8 1.0X
+InSet expression 108 110 1 92.3 10.8 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 99 99 1 101.5 9.9 1.0X
-InSet expression 147 149 1 68.0 14.7 0.7X
+In expression 100 101 2 99.7 10.0 1.0X
+InSet expression 134 135 1 74.8 13.4 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 178 180 2 56.1 17.8 1.0X
-InSet expression 133 136 3 75.0 13.3 1.3X
+In expression 180 181 1 55.6 18.0 1.0X
+InSet expression 121 124 2 82.4 12.1 1.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 338 344 6 29.5 33.8 1.0X
-InSet expression 138 139 1 72.7 13.8 2.5X
+In expression 338 347 6 29.6 33.8 1.0X
+InSet expression 128 130 1 77.9 12.8 2.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 506 509 2 19.7 50.6 1.0X
-InSet expression 146 148 3 68.5 14.6 3.5X
+In expression 507 509 4 19.7 50.7 1.0X
+InSet expression 136 139 2 73.5 13.6 3.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 670 677 8 14.9 67.0 1.0X
-InSet expression 159 162 2 62.8 15.9 4.2X
+In expression 674 676 3 14.8 67.4 1.0X
+InSet expression 148 151 2 67.6 14.8 4.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 833 864 66 12.0 83.3 1.0X
-InSet expression 172 173 1 58.3 17.2 4.9X
+In expression 833 867 62 12.0 83.3 1.0X
+InSet expression 160 162 1 62.6 16.0 5.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 19 20 3 537.7 1.9 1.0X
-InSet expression 75 76 1 134.2 7.5 0.2X
+In expression 20 22 2 498.7 2.0 1.0X
+InSet expression 87 89 2 115.6 8.7 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 28 30 2 356.7 2.8 1.0X
-InSet expression 91 94 3 109.5 9.1 0.3X
+In expression 30 32 3 337.9 3.0 1.0X
+InSet expression 102 105 4 98.4 10.2 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 50 52 3 199.6 5.0 1.0X
-InSet expression 91 93 1 109.5 9.1 0.5X
+In expression 54 57 3 185.2 5.4 1.0X
+InSet expression 102 104 2 98.0 10.2 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 91 92 1 110.4 9.1 1.0X
-InSet expression 129 130 1 77.7 12.9 0.7X
+In expression 93 94 1 107.8 9.3 1.0X
+InSet expression 137 139 2 73.2 13.7 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 170 171 1 58.9 17.0 1.0X
-InSet expression 110 111 1 91.1 11.0 1.5X
+In expression 173 180 3 57.7 17.3 1.0X
+InSet expression 122 125 4 81.8 12.2 1.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 328 345 14 30.5 32.8 1.0X
-InSet expression 117 119 2 85.5 11.7 2.8X
+In expression 330 344 14 30.3 33.0 1.0X
+InSet expression 130 132 2 77.0 13.0 2.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 36 39 3 279.2 3.6 1.0X
-InSet expression 77 79 2 129.3 7.7 0.5X
+In expression 35 41 4 287.7 3.5 1.0X
+InSet expression 78 79 1 128.8 7.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 58 63 3 173.0 5.8 1.0X
-InSet expression 99 101 2 101.4 9.9 0.6X
+In expression 63 64 2 158.9 6.3 1.0X
+InSet expression 101 103 1 98.9 10.1 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 147 149 2 67.8 14.7 1.0X
-InSet expression 98 100 2 102.3 9.8 1.5X
+In expression 149 150 1 67.1 14.9 1.0X
+InSet expression 100 106 18 100.4 10.0 1.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 228 231 3 43.8 22.8 1.0X
-InSet expression 144 146 2 69.3 14.4 1.6X
+In expression 232 237 4 43.2 23.2 1.0X
+InSet expression 147 151 4 67.8 14.7 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 382 388 6 26.2 38.2 1.0X
-InSet expression 115 117 2 86.8 11.5 3.3X
+In expression 384 386 1 26.0 38.4 1.0X
+InSet expression 119 121 2 84.4 11.9 3.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1921 1958 80 5.2 192.1 1.0X
-InSet expression 117 119 1 85.2 11.7 16.4X
+In expression 1901 1936 67 5.3 190.1 1.0X
+InSet expression 122 124 2 82.0 12.2 15.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 36 38 2 274.4 3.6 1.0X
-InSet expression 77 79 1 129.8 7.7 0.5X
+In expression 38 40 3 263.8 3.8 1.0X
+InSet expression 78 80 2 127.9 7.8 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 60 61 3 167.8 6.0 1.0X
-InSet expression 98 100 1 101.8 9.8 0.6X
+In expression 62 63 2 161.8 6.2 1.0X
+InSet expression 100 101 1 99.6 10.0 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 147 149 2 67.9 14.7 1.0X
-InSet expression 97 98 1 103.5 9.7 1.5X
+In expression 150 151 1 66.6 15.0 1.0X
+InSet expression 101 102 1 99.5 10.1 1.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 228 229 1 43.9 22.8 1.0X
-InSet expression 144 147 2 69.4 14.4 1.6X
+In expression 231 232 1 43.3 23.1 1.0X
+InSet expression 144 147 1 69.6 14.4 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 394 396 2 25.4 39.4 1.0X
-InSet expression 117 119 1 85.4 11.7 3.4X
+In expression 390 395 4 25.6 39.0 1.0X
+InSet expression 117 118 1 85.8 11.7 3.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 2228 2268 82 4.5 222.8 1.0X
-InSet expression 120 122 2 83.4 12.0 18.6X
+In expression 2231 2275 79 4.5 223.1 1.0X
+InSet expression 120 122 1 83.6 12.0 18.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 19 21 2 51.8 19.3 1.0X
-InSet expression 49 51 1 20.4 48.9 0.4X
+In expression 21 23 2 47.6 21.0 1.0X
+InSet expression 51 53 2 19.5 51.3 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 25 27 2 39.4 25.4 1.0X
-InSet expression 51 53 3 19.6 50.9 0.5X
+In expression 27 28 2 37.1 26.9 1.0X
+InSet expression 54 56 3 18.5 54.1 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 40 43 4 25.2 39.7 1.0X
-InSet expression 52 56 8 19.4 51.6 0.8X
+In expression 41 45 3 24.5 40.8 1.0X
+InSet expression 54 55 2 18.6 53.8 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 78 83 4 12.8 78.4 1.0X
-InSet expression 57 58 2 17.7 56.6 1.4X
+In expression 80 84 4 12.5 80.0 1.0X
+InSet expression 59 61 2 17.0 58.9 1.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 241 242 1 4.1 241.4 1.0X
-InSet expression 54 59 4 18.4 54.4 4.4X
+In expression 241 242 2 4.2 240.9 1.0X
+InSet expression 57 58 1 17.6 56.9 4.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 582 586 3 1.7 581.8 1.0X
-InSet expression 56 58 1 17.8 56.2 10.3X
+In expression 580 582 2 1.7 580.2 1.0X
+InSet expression 59 61 2 17.1 58.5 9.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 5 6 2 211.6 4.7 1.0X
-InSet expression 5 5 2 219.6 4.6 1.0X
+In expression 5 7 2 201.5 5.0 1.0X
+InSet expression 5 7 2 207.6 4.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 5 6 2 212.4 4.7 1.0X
-InSet expression 5 5 2 218.3 4.6 1.0X
+In expression 5 6 2 207.3 4.8 1.0X
+InSet expression 5 6 2 213.9 4.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 5 6 2 196.9 5.1 1.0X
-InSet expression 5 6 2 202.0 4.9 1.0X
+In expression 5 7 2 197.8 5.1 1.0X
+InSet expression 5 6 2 198.9 5.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 6 6 2 174.3 5.7 1.0X
-InSet expression 6 7 2 172.5 5.8 1.0X
+In expression 6 8 2 170.6 5.9 1.0X
+InSet expression 6 7 2 168.6 5.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 7 8 2 135.3 7.4 1.0X
-InSet expression 7 8 2 138.4 7.2 1.0X
+In expression 8 9 2 129.1 7.7 1.0X
+InSet expression 7 9 2 136.3 7.3 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 11 11 2 94.3 10.6 1.0X
-InSet expression 11 12 3 94.2 10.6 1.0X
+In expression 10 12 2 95.3 10.5 1.0X
+InSet expression 11 13 3 92.8 10.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 28 29 2 35.5 28.2 1.0X
-InSet expression 42 43 1 24.1 41.5 0.7X
+In expression 28 30 1 35.2 28.4 1.0X
+InSet expression 42 44 1 23.6 42.3 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 33 34 2 29.9 33.4 1.0X
-InSet expression 44 45 2 22.7 44.1 0.8X
+In expression 34 35 1 29.5 33.9 1.0X
+InSet expression 45 47 2 22.1 45.2 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 42 43 1 23.8 42.0 1.0X
-InSet expression 48 49 1 20.6 48.5 0.9X
+In expression 43 45 1 23.2 43.1 1.0X
+InSet expression 50 51 1 20.1 49.9 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 57 61 3 17.6 57.0 1.0X
-InSet expression 52 55 3 19.1 52.3 1.1X
+In expression 59 63 3 17.0 58.8 1.0X
+InSet expression 54 55 1 18.6 53.9 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 88 89 1 11.3 88.3 1.0X
-InSet expression 49 50 1 20.4 48.9 1.8X
+In expression 90 94 3 11.1 89.7 1.0X
+InSet expression 51 52 2 19.7 50.7 1.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 509 511 2 2.0 508.9 1.0X
-InSet expression 49 50 1 20.2 49.4 10.3X
+In expression 427 430 4 2.3 427.2 1.0X
+InSet expression 52 53 3 19.4 51.5 8.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 16 18 2 607.3 1.6 1.0X
-InSet expression 81 82 1 124.0 8.1 0.2X
+In expression 17 19 2 591.4 1.7 1.0X
+InSet expression 81 82 1 123.9 8.1 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 22 23 2 451.5 2.2 1.0X
-InSet expression 94 96 1 105.9 9.4 0.2X
+In expression 22 24 2 451.1 2.2 1.0X
+InSet expression 94 95 1 106.1 9.4 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 47 49 3 213.9 4.7 1.0X
-InSet expression 128 130 1 77.9 12.8 0.4X
+In expression 48 50 2 210.3 4.8 1.0X
+InSet expression 127 129 4 79.0 12.7 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 80 81 1 125.0 8.0 1.0X
-InSet expression 161 163 1 62.1 16.1 0.5X
+In expression 81 82 1 123.0 8.1 1.0X
+InSet expression 159 161 2 63.0 15.9 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 151 152 1 66.0 15.1 1.0X
-InSet expression 137 139 2 72.8 13.7 1.1X
+In expression 153 154 1 65.4 15.3 1.0X
+InSet expression 137 139 1 73.1 13.7 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 296 308 11 33.7 29.6 1.0X
-InSet expression 132 134 2 75.7 13.2 2.2X
+In expression 295 305 11 33.9 29.5 1.0X
+InSet expression 131 133 1 76.4 13.1 2.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 287 289 2 34.8 28.7 1.0X
-InSet expression 282 290 6 35.5 28.2 1.0X
+In expression 313 314 1 32.0 31.3 1.0X
+InSet expression 306 307 2 32.7 30.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 304 305 1 32.9 30.4 1.0X
-InSet expression 286 289 2 35.0 28.6 1.1X
+In expression 325 329 4 30.8 32.5 1.0X
+InSet expression 306 308 2 32.7 30.6 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 327 335 7 30.6 32.7 1.0X
-InSet expression 291 296 6 34.4 29.1 1.1X
+In expression 364 365 2 27.5 36.4 1.0X
+InSet expression 306 308 1 32.7 30.6 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 397 399 1 25.2 39.7 1.0X
-InSet expression 282 286 3 35.5 28.2 1.4X
+In expression 411 412 1 24.3 41.1 1.0X
+InSet expression 305 308 2 32.8 30.5 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 476 478 1 21.0 47.6 1.0X
-InSet expression 283 288 4 35.3 28.3 1.7X
+In expression 493 496 4 20.3 49.3 1.0X
+InSet expression 310 312 1 32.2 31.0 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 626 628 2 16.0 62.6 1.0X
-InSet expression 287 291 4 34.9 28.7 2.2X
+In expression 657 660 3 15.2 65.7 1.0X
+InSet expression 311 312 1 32.2 31.1 2.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 788 791 2 12.7 78.8 1.0X
-InSet expression 286 292 5 35.0 28.6 2.8X
+In expression 812 862 28 12.3 81.2 1.0X
+InSet expression 316 317 2 31.7 31.6 2.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 956 960 5 10.5 95.6 1.0X
-InSet expression 293 297 2 34.1 29.3 3.3X
+In expression 978 981 3 10.2 97.8 1.0X
+InSet expression 311 317 5 32.1 31.1 3.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1114 1120 4 9.0 111.4 1.0X
-InSet expression 380 382 1 26.3 38.0 2.9X
+In expression 1144 1152 8 8.7 114.4 1.0X
+InSet expression 391 392 1 25.6 39.1 2.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 25 26 1 40.3 24.8 1.0X
-InSet expression 57 58 1 17.6 56.7 0.4X
+In expression 27 28 1 37.1 27.0 1.0X
+InSet expression 60 61 1 16.8 59.6 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 39 43 3 25.4 39.4 1.0X
-InSet expression 85 87 1 11.7 85.5 0.5X
+In expression 42 46 3 24.0 41.7 1.0X
+InSet expression 89 90 1 11.3 88.7 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 133 134 1 7.5 133.0 1.0X
-InSet expression 100 103 3 10.0 100.2 1.3X
+In expression 169 175 4 5.9 169.4 1.0X
+InSet expression 104 105 2 9.7 103.6 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 410 411 1 2.4 409.7 1.0X
-InSet expression 129 133 4 7.7 129.1 3.2X
+In expression 393 396 3 2.5 393.4 1.0X
+InSet expression 133 136 3 7.5 133.1 3.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 792 795 2 1.3 792.0 1.0X
-InSet expression 147 148 2 6.8 147.0 5.4X
+In expression 817 821 4 1.2 817.2 1.0X
+InSet expression 151 151 0 6.6 150.5 5.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1758 1924 334 0.6 1758.0 1.0X
-InSet expression 164 166 1 6.1 164.3 10.7X
+In expression 1702 1856 335 0.6 1702.4 1.0X
+InSet expression 167 168 2 6.0 166.6 10.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 16 17 2 61.4 16.3 1.0X
-InSet expression 81 83 1 12.3 81.5 0.2X
+In expression 17 18 1 58.4 17.1 1.0X
+InSet expression 87 88 1 11.5 87.0 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 23 24 1 43.1 23.2 1.0X
-InSet expression 126 128 1 7.9 126.2 0.2X
+In expression 24 25 2 42.1 23.7 1.0X
+InSet expression 132 134 2 7.6 131.8 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 70 74 3 14.3 70.1 1.0X
-InSet expression 149 153 9 6.7 148.5 0.5X
+In expression 72 77 4 14.0 71.6 1.0X
+InSet expression 155 157 2 6.5 154.7 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 207 211 3 4.8 207.1 1.0X
-InSet expression 192 196 2 5.2 192.4 1.1X
+In expression 198 203 4 5.0 198.5 1.0X
+InSet expression 201 203 3 5.0 200.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 575 580 4 1.7 575.3 1.0X
-InSet expression 218 221 2 4.6 218.5 2.6X
+In expression 562 564 3 1.8 561.8 1.0X
+InSet expression 224 227 1 4.5 224.1 2.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1351 1527 240 0.7 1350.5 1.0X
-InSet expression 249 252 2 4.0 249.3 5.4X
+In expression 1333 1511 260 0.8 1333.3 1.0X
+InSet expression 269 274 7 3.7 269.2 5.0X
diff --git a/sql/core/benchmarks/InExpressionBenchmark-results.txt b/sql/core/benchmarks/InExpressionBenchmark-results.txt
index 16e3c78bdb722..a72d901035c49 100644
--- a/sql/core/benchmarks/InExpressionBenchmark-results.txt
+++ b/sql/core/benchmarks/InExpressionBenchmark-results.txt
@@ -2,739 +2,739 @@
In Expression Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 40 56 8 249.7 4.0 1.0X
-InSet expression 80 87 4 124.5 8.0 0.5X
+In expression 38 52 9 264.5 3.8 1.0X
+InSet expression 85 91 4 117.7 8.5 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 38 42 4 264.1 3.8 1.0X
-InSet expression 76 80 4 130.9 7.6 0.5X
+In expression 37 42 5 273.4 3.7 1.0X
+InSet expression 82 86 4 122.1 8.2 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 66 69 3 151.9 6.6 1.0X
-InSet expression 85 89 4 117.8 8.5 0.8X
+In expression 65 67 2 154.1 6.5 1.0X
+InSet expression 83 88 5 120.8 8.3 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 106 108 3 94.2 10.6 1.0X
-InSet expression 90 93 3 111.3 9.0 1.2X
+In expression 106 108 2 94.6 10.6 1.0X
+InSet expression 89 91 4 112.9 8.9 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 194 197 4 51.5 19.4 1.0X
-InSet expression 101 103 3 99.3 10.1 1.9X
+In expression 194 196 3 51.6 19.4 1.0X
+InSet expression 98 101 2 101.6 9.8 2.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 bytes: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 397 400 3 25.2 39.7 1.0X
-InSet expression 197 205 6 50.9 19.7 2.0X
+In expression 397 400 2 25.2 39.7 1.0X
+InSet expression 195 199 5 51.4 19.5 2.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 31 34 4 323.9 3.1 1.0X
-InSet expression 100 103 4 99.8 10.0 0.3X
+In expression 34 37 3 297.7 3.4 1.0X
+InSet expression 98 101 2 101.7 9.8 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 37 39 2 272.3 3.7 1.0X
-InSet expression 115 118 2 86.6 11.5 0.3X
+In expression 36 39 2 274.2 3.6 1.0X
+InSet expression 113 116 3 88.7 11.3 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 72 74 4 138.7 7.2 1.0X
-InSet expression 115 117 1 87.0 11.5 0.6X
+In expression 72 74 2 138.5 7.2 1.0X
+InSet expression 112 115 2 89.0 11.2 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 118 121 5 84.8 11.8 1.0X
-InSet expression 142 146 4 70.4 14.2 0.8X
+In expression 118 120 3 84.9 11.8 1.0X
+InSet expression 142 144 1 70.6 14.2 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 186 189 5 53.7 18.6 1.0X
-InSet expression 126 131 5 79.2 12.6 1.5X
+In expression 198 200 2 50.4 19.8 1.0X
+InSet expression 126 129 3 79.2 12.6 1.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 366 373 14 27.4 36.6 1.0X
-InSet expression 134 138 4 74.7 13.4 2.7X
+In expression 366 368 2 27.3 36.6 1.0X
+InSet expression 132 135 2 75.6 13.2 2.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 550 552 4 18.2 55.0 1.0X
-InSet expression 146 151 4 68.4 14.6 3.8X
+In expression 551 552 2 18.2 55.1 1.0X
+InSet expression 146 149 2 68.3 14.6 3.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 668 673 5 15.0 66.8 1.0X
-InSet expression 161 164 5 62.3 16.1 4.2X
+In expression 668 669 1 15.0 66.8 1.0X
+InSet expression 158 162 3 63.2 15.8 4.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 shorts: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 941 946 6 10.6 94.1 1.0X
-InSet expression 174 183 18 57.4 17.4 5.4X
+In expression 939 941 3 10.7 93.9 1.0X
+InSet expression 172 174 1 58.1 17.2 5.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 30 31 3 336.9 3.0 1.0X
-InSet expression 97 99 2 103.3 9.7 0.3X
+In expression 30 31 1 337.0 3.0 1.0X
+InSet expression 94 96 1 105.9 9.4 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 37 39 2 270.3 3.7 1.0X
-InSet expression 114 116 2 87.9 11.4 0.3X
+In expression 36 39 3 274.8 3.6 1.0X
+InSet expression 112 115 2 89.0 11.2 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 70 72 2 143.1 7.0 1.0X
-InSet expression 133 136 2 75.1 13.3 0.5X
+In expression 70 71 2 142.3 7.0 1.0X
+InSet expression 133 135 1 75.1 13.3 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 105 107 1 94.8 10.5 1.0X
-InSet expression 148 151 1 67.4 14.8 0.7X
+In expression 106 107 1 94.4 10.6 1.0X
+InSet expression 149 151 2 67.3 14.9 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 196 200 5 51.0 19.6 1.0X
-InSet expression 129 133 3 77.4 12.9 1.5X
+In expression 196 197 2 51.0 19.6 1.0X
+InSet expression 128 131 2 78.0 12.8 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 354 356 3 28.3 35.4 1.0X
-InSet expression 134 137 5 74.9 13.4 2.6X
+In expression 354 355 1 28.3 35.4 1.0X
+InSet expression 133 135 1 74.9 13.3 2.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 659 662 4 15.2 65.9 1.0X
-InSet expression 147 150 5 68.2 14.7 4.5X
+In expression 502 502 0 19.9 50.2 1.0X
+InSet expression 143 145 1 70.0 14.3 3.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 668 669 2 15.0 66.8 1.0X
-InSet expression 157 160 2 63.6 15.7 4.3X
+In expression 669 671 3 14.9 66.9 1.0X
+InSet expression 155 158 2 64.6 15.5 4.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 shorts (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 854 857 4 11.7 85.4 1.0X
-InSet expression 169 173 3 59.2 16.9 5.1X
+In expression 860 861 2 11.6 86.0 1.0X
+InSet expression 167 172 3 59.9 16.7 5.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 28 30 2 354.7 2.8 1.0X
-InSet expression 99 100 1 101.3 9.9 0.3X
+In expression 28 30 3 362.5 2.8 1.0X
+InSet expression 96 98 2 103.7 9.6 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 35 36 2 285.9 3.5 1.0X
-InSet expression 114 116 1 87.8 11.4 0.3X
+In expression 36 37 1 278.5 3.6 1.0X
+InSet expression 112 114 1 89.3 11.2 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 62 64 3 161.4 6.2 1.0X
-InSet expression 117 120 3 85.3 11.7 0.5X
+In expression 62 65 7 161.9 6.2 1.0X
+InSet expression 115 117 1 86.8 11.5 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 114 115 1 87.6 11.4 1.0X
-InSet expression 145 147 1 69.2 14.5 0.8X
+In expression 105 106 1 95.3 10.5 1.0X
+InSet expression 143 144 2 70.2 14.3 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 195 197 2 51.4 19.5 1.0X
-InSet expression 126 127 1 79.6 12.6 1.5X
+In expression 184 184 1 54.4 18.4 1.0X
+InSet expression 122 123 1 82.3 12.2 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 351 357 3 28.5 35.1 1.0X
-InSet expression 131 135 5 76.2 13.1 2.7X
+In expression 352 355 2 28.4 35.2 1.0X
+InSet expression 128 131 3 78.3 12.8 2.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 511 520 5 19.6 51.1 1.0X
-InSet expression 143 147 8 70.0 14.3 3.6X
+In expression 514 533 18 19.4 51.4 1.0X
+InSet expression 140 143 5 71.5 14.0 3.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 673 689 10 14.9 67.3 1.0X
-InSet expression 154 157 3 64.9 15.4 4.4X
+In expression 668 678 8 15.0 66.8 1.0X
+InSet expression 151 154 1 66.1 15.1 4.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 828 860 42 12.1 82.8 1.0X
-InSet expression 167 170 6 60.0 16.7 5.0X
+In expression 836 850 13 12.0 83.6 1.0X
+InSet expression 164 166 1 60.9 16.4 5.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 22 25 4 461.8 2.2 1.0X
-InSet expression 95 98 3 105.3 9.5 0.2X
+In expression 22 24 4 451.0 2.2 1.0X
+InSet expression 93 95 2 107.4 9.3 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 28 30 2 354.7 2.8 1.0X
-InSet expression 110 114 3 90.7 11.0 0.3X
+In expression 28 30 2 351.9 2.8 1.0X
+InSet expression 109 110 1 92.1 10.9 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 55 57 1 180.8 5.5 1.0X
-InSet expression 125 129 7 79.8 12.5 0.4X
+In expression 55 57 2 180.3 5.5 1.0X
+InSet expression 124 125 1 80.8 12.4 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 100 101 1 100.3 10.0 1.0X
-InSet expression 142 145 3 70.3 14.2 0.7X
+In expression 101 102 1 99.3 10.1 1.0X
+InSet expression 143 145 1 69.9 14.3 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 179 180 1 55.9 17.9 1.0X
-InSet expression 128 132 8 78.1 12.8 1.4X
+In expression 180 184 8 55.6 18.0 1.0X
+InSet expression 124 128 3 80.3 12.4 1.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 345 348 3 29.0 34.5 1.0X
-InSet expression 132 135 2 75.6 13.2 2.6X
+In expression 346 347 2 28.9 34.6 1.0X
+InSet expression 129 133 5 77.3 12.9 2.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 507 509 2 19.7 50.7 1.0X
-InSet expression 142 145 5 70.6 14.2 3.6X
+In expression 506 508 3 19.8 50.6 1.0X
+InSet expression 139 142 3 72.0 13.9 3.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 662 667 4 15.1 66.2 1.0X
-InSet expression 154 156 1 65.0 15.4 4.3X
+In expression 658 664 4 15.2 65.8 1.0X
+InSet expression 151 153 2 66.3 15.1 4.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 ints (non-compact): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 820 856 78 12.2 82.0 1.0X
-InSet expression 165 170 4 60.4 16.5 5.0X
+In expression 821 864 95 12.2 82.1 1.0X
+InSet expression 163 165 1 61.4 16.3 5.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 21 23 3 481.5 2.1 1.0X
-InSet expression 87 89 2 114.5 8.7 0.2X
+In expression 21 23 3 467.1 2.1 1.0X
+InSet expression 88 89 2 114.2 8.8 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 29 31 3 350.3 2.9 1.0X
-InSet expression 103 107 3 97.0 10.3 0.3X
+In expression 29 31 1 343.5 2.9 1.0X
+InSet expression 103 106 4 97.3 10.3 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 54 55 2 186.1 5.4 1.0X
-InSet expression 105 111 13 95.4 10.5 0.5X
+In expression 55 56 1 183.2 5.5 1.0X
+InSet expression 105 108 3 94.9 10.5 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 92 97 3 108.4 9.2 1.0X
+In expression 95 97 2 105.7 9.5 1.0X
InSet expression 134 137 2 74.5 13.4 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 174 183 6 57.6 17.4 1.0X
-InSet expression 113 119 14 88.2 11.3 1.5X
+In expression 177 182 4 56.6 17.7 1.0X
+InSet expression 115 117 1 86.8 11.5 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 330 352 13 30.3 33.0 1.0X
-InSet expression 118 121 2 84.8 11.8 2.8X
+In expression 330 342 12 30.3 33.0 1.0X
+InSet expression 121 123 1 82.3 12.1 2.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 35 37 2 284.5 3.5 1.0X
-InSet expression 115 118 3 87.3 11.5 0.3X
+In expression 40 42 2 252.8 4.0 1.0X
+InSet expression 95 97 1 104.8 9.5 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 63 65 1 157.8 6.3 1.0X
-InSet expression 145 146 1 69.0 14.5 0.4X
+In expression 64 65 1 156.9 6.4 1.0X
+InSet expression 115 117 1 86.8 11.5 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 127 129 1 78.5 12.7 1.0X
-InSet expression 144 147 4 69.5 14.4 0.9X
+In expression 127 129 3 78.7 12.7 1.0X
+InSet expression 117 118 1 85.4 11.7 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
In expression 209 210 1 47.8 20.9 1.0X
-InSet expression 189 191 2 52.8 18.9 1.1X
+InSet expression 158 160 3 63.4 15.8 1.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 366 368 3 27.3 36.6 1.0X
-InSet expression 148 151 5 67.7 14.8 2.5X
+In expression 367 367 1 27.3 36.7 1.0X
+InSet expression 128 130 2 78.4 12.8 2.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 floats: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1693 1819 98 5.9 169.3 1.0X
-InSet expression 151 154 3 66.1 15.1 11.2X
+In expression 1672 1739 94 6.0 167.2 1.0X
+InSet expression 133 135 2 75.2 13.3 12.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 41 43 3 243.1 4.1 1.0X
-InSet expression 115 117 1 86.6 11.5 0.4X
+In expression 40 42 4 252.2 4.0 1.0X
+InSet expression 116 119 6 86.0 11.6 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 63 65 1 157.9 6.3 1.0X
-InSet expression 145 147 1 69.2 14.5 0.4X
+In expression 62 64 2 160.7 6.2 1.0X
+InSet expression 146 148 1 68.3 14.6 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 129 131 2 77.4 12.9 1.0X
-InSet expression 144 146 2 69.4 14.4 0.9X
+In expression 129 130 1 77.4 12.9 1.0X
+InSet expression 143 144 1 70.0 14.3 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 210 211 2 47.7 21.0 1.0X
-InSet expression 191 195 4 52.4 19.1 1.1X
+In expression 209 210 1 47.8 20.9 1.0X
+InSet expression 192 195 3 52.0 19.2 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 367 368 1 27.3 36.7 1.0X
-InSet expression 150 163 36 66.6 15.0 2.4X
+In expression 366 367 1 27.3 36.6 1.0X
+InSet expression 150 152 2 66.5 15.0 2.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 doubles: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1929 2031 96 5.2 192.9 1.0X
-InSet expression 149 152 1 67.1 14.9 12.9X
+In expression 1953 2014 103 5.1 195.3 1.0X
+InSet expression 154 156 1 64.8 15.4 12.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 20 22 3 49.9 20.0 1.0X
-InSet expression 62 65 3 16.0 62.5 0.3X
+In expression 20 22 3 49.4 20.2 1.0X
+InSet expression 58 60 1 17.2 58.1 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 25 27 2 39.3 25.5 1.0X
-InSet expression 64 66 2 15.6 64.2 0.4X
+In expression 25 27 1 39.9 25.0 1.0X
+InSet expression 60 62 2 16.6 60.4 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 41 43 2 24.4 41.0 1.0X
-InSet expression 65 67 2 15.3 65.3 0.6X
+In expression 41 43 1 24.3 41.1 1.0X
+InSet expression 60 63 2 16.5 60.5 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 79 81 3 12.6 79.1 1.0X
-InSet expression 70 72 1 14.4 69.7 1.1X
+In expression 79 80 1 12.6 79.3 1.0X
+InSet expression 65 68 2 15.4 65.1 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 236 237 2 4.2 235.9 1.0X
-InSet expression 69 71 2 14.4 69.3 3.4X
+In expression 237 238 2 4.2 236.6 1.0X
+InSet expression 63 64 1 15.9 62.9 3.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 small decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 558 623 139 1.8 557.5 1.0X
-InSet expression 70 73 2 14.2 70.4 7.9X
+In expression 558 616 124 1.8 558.3 1.0X
+InSet expression 65 67 1 15.5 64.7 8.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 5 6 1 201.1 5.0 1.0X
-InSet expression 5 6 1 205.5 4.9 1.0X
+In expression 5 7 1 182.6 5.5 1.0X
+InSet expression 5 7 1 190.9 5.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 5 6 1 202.4 4.9 1.0X
-InSet expression 5 6 1 206.3 4.8 1.0X
+In expression 5 6 1 192.6 5.2 1.0X
+InSet expression 5 6 1 201.3 5.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 5 6 1 191.2 5.2 1.0X
-InSet expression 5 6 1 190.9 5.2 1.0X
+In expression 6 7 1 180.3 5.5 1.0X
+InSet expression 5 6 1 186.4 5.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 6 6 1 168.7 5.9 1.0X
-InSet expression 6 6 1 168.2 5.9 1.0X
+In expression 6 7 1 163.0 6.1 1.0X
+InSet expression 6 7 1 164.1 6.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 8 9 1 130.5 7.7 1.0X
-InSet expression 8 8 1 132.0 7.6 1.0X
+In expression 8 10 1 123.9 8.1 1.0X
+InSet expression 8 9 1 124.0 8.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 large decimals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 11 12 2 90.9 11.0 1.0X
-InSet expression 11 12 1 90.6 11.0 1.0X
+In expression 11 12 1 88.2 11.3 1.0X
+InSet expression 11 13 2 89.3 11.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 30 31 1 33.5 29.9 1.0X
-InSet expression 47 48 1 21.2 47.1 0.6X
+In expression 29 31 1 34.3 29.2 1.0X
+InSet expression 47 49 2 21.1 47.4 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 35 38 3 28.4 35.3 1.0X
-InSet expression 49 51 2 20.2 49.4 0.7X
+In expression 35 36 1 28.8 34.7 1.0X
+InSet expression 49 50 1 20.6 48.5 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 44 45 1 22.8 43.9 1.0X
-InSet expression 53 55 2 18.7 53.4 0.8X
+In expression 43 44 1 23.4 42.8 1.0X
+InSet expression 53 54 1 19.0 52.6 0.8X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 59 60 2 17.0 58.7 1.0X
-InSet expression 57 59 1 17.5 57.3 1.0X
+In expression 57 59 1 17.5 57.3 1.0X
+InSet expression 55 58 4 18.0 55.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 88 90 2 11.3 88.4 1.0X
-InSet expression 53 55 1 18.8 53.3 1.7X
+In expression 86 87 1 11.6 85.9 1.0X
+InSet expression 52 54 2 19.2 52.0 1.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 394 398 9 2.5 393.9 1.0X
-InSet expression 54 56 2 18.6 53.7 7.3X
+In expression 378 379 1 2.6 377.6 1.0X
+InSet expression 52 55 2 19.1 52.5 7.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 16 19 2 607.4 1.6 1.0X
-InSet expression 89 91 1 111.7 8.9 0.2X
+In expression 16 18 3 623.0 1.6 1.0X
+InSet expression 90 92 1 110.8 9.0 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 24 26 1 412.7 2.4 1.0X
-InSet expression 100 101 1 100.2 10.0 0.2X
+In expression 23 24 1 430.0 2.3 1.0X
+InSet expression 101 107 16 99.4 10.1 0.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 47 48 2 210.7 4.7 1.0X
-InSet expression 127 129 1 79.0 12.7 0.4X
+In expression 46 47 1 219.5 4.6 1.0X
+InSet expression 127 129 4 78.9 12.7 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 82 84 2 121.4 8.2 1.0X
-InSet expression 154 156 2 65.0 15.4 0.5X
+In expression 81 82 1 123.7 8.1 1.0X
+InSet expression 154 156 2 64.9 15.4 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 154 154 1 65.1 15.4 1.0X
-InSet expression 132 135 3 75.5 13.2 1.2X
+In expression 153 153 1 65.4 15.3 1.0X
+InSet expression 135 136 1 74.2 13.5 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 295 306 12 33.9 29.5 1.0X
-InSet expression 128 130 2 78.1 12.8 2.3X
+In expression 295 306 13 33.9 29.5 1.0X
+InSet expression 130 131 1 77.2 13.0 2.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 371 373 3 27.0 37.1 1.0X
-InSet expression 365 371 5 27.4 36.5 1.0X
+In expression 367 367 1 27.3 36.7 1.0X
+InSet expression 363 364 1 27.5 36.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 380 382 1 26.3 38.0 1.0X
-InSet expression 364 365 1 27.5 36.4 1.0X
+In expression 373 380 5 26.8 37.3 1.0X
+InSet expression 369 374 3 27.1 36.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 404 407 3 24.7 40.4 1.0X
-InSet expression 369 371 1 27.1 36.9 1.1X
+In expression 413 415 1 24.2 41.3 1.0X
+InSet expression 362 363 1 27.6 36.2 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 460 462 3 21.8 46.0 1.0X
-InSet expression 363 365 2 27.5 36.3 1.3X
+In expression 457 461 6 21.9 45.7 1.0X
+InSet expression 366 367 1 27.3 36.6 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 543 552 12 18.4 54.3 1.0X
-InSet expression 370 372 3 27.1 37.0 1.5X
+In expression 545 546 1 18.4 54.5 1.0X
+InSet expression 364 372 15 27.5 36.4 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 706 711 6 14.2 70.6 1.0X
-InSet expression 371 376 5 26.9 37.1 1.9X
+In expression 707 708 1 14.1 70.7 1.0X
+InSet expression 368 378 7 27.2 36.8 1.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
300 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 868 882 10 11.5 86.8 1.0X
-InSet expression 366 376 6 27.4 36.6 2.4X
+In expression 866 868 3 11.6 86.6 1.0X
+InSet expression 384 386 1 26.0 38.4 2.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
400 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1026 1041 9 9.7 102.6 1.0X
-InSet expression 370 379 7 27.0 37.0 2.8X
+In expression 1031 1034 2 9.7 103.1 1.0X
+InSet expression 385 385 1 26.0 38.5 2.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
500 dates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1209 1214 6 8.3 120.9 1.0X
-InSet expression 463 471 5 21.6 46.3 2.6X
+In expression 1220 1223 3 8.2 122.0 1.0X
+InSet expression 462 463 2 21.7 46.2 2.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 27 29 2 36.8 27.1 1.0X
-InSet expression 58 59 1 17.4 57.6 0.5X
+In expression 25 26 1 40.2 24.9 1.0X
+InSet expression 55 57 1 18.2 54.9 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 42 43 2 24.1 41.6 1.0X
-InSet expression 85 87 1 11.8 85.1 0.5X
+In expression 40 41 2 25.0 40.0 1.0X
+InSet expression 83 85 1 12.1 83.0 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 181 183 2 5.5 181.2 1.0X
-InSet expression 99 102 4 10.1 99.4 1.8X
+In expression 135 136 1 7.4 135.0 1.0X
+InSet expression 98 100 2 10.2 98.1 1.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 384 389 8 2.6 384.2 1.0X
-InSet expression 128 131 2 7.8 128.1 3.0X
+In expression 372 375 5 2.7 371.7 1.0X
+InSet expression 125 129 4 8.0 125.3 3.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 769 775 5 1.3 769.0 1.0X
-InSet expression 143 146 1 7.0 143.3 5.4X
+In expression 753 755 1 1.3 753.3 1.0X
+InSet expression 141 143 1 7.1 141.0 5.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 arrays: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1684 1898 330 0.6 1684.1 1.0X
-InSet expression 162 165 4 6.2 162.1 10.4X
+In expression 1502 1786 267 0.7 1501.6 1.0X
+InSet expression 160 160 1 6.3 159.6 9.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
5 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 22 23 1 45.4 22.0 1.0X
-InSet expression 80 83 6 12.4 80.4 0.3X
+In expression 20 22 2 48.8 20.5 1.0X
+InSet expression 77 80 3 12.9 77.2 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
10 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 32 33 2 31.6 31.7 1.0X
-InSet expression 121 123 2 8.2 121.3 0.3X
+In expression 30 32 1 33.2 30.1 1.0X
+InSet expression 117 118 1 8.6 116.6 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
25 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 85 86 1 11.7 85.2 1.0X
-InSet expression 142 145 3 7.0 142.3 0.6X
+In expression 70 71 1 14.3 70.0 1.0X
+InSet expression 137 142 14 7.3 136.6 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
50 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 203 205 4 4.9 202.7 1.0X
-InSet expression 182 186 2 5.5 182.4 1.1X
+In expression 217 220 2 4.6 216.6 1.0X
+InSet expression 177 179 3 5.7 176.6 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
100 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 489 511 13 2.0 489.0 1.0X
-InSet expression 205 207 1 4.9 205.0 2.4X
+In expression 510 513 2 2.0 510.3 1.0X
+InSet expression 198 202 5 5.0 198.0 2.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
200 structs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-In expression 1256 1403 264 0.8 1256.3 1.0X
-InSet expression 237 245 11 4.2 237.1 5.3X
+In expression 1222 1430 265 0.8 1222.2 1.0X
+InSet expression 233 235 2 4.3 232.6 5.3X
diff --git a/sql/core/benchmarks/InMemoryColumnarBenchmark-jdk21-results.txt b/sql/core/benchmarks/InMemoryColumnarBenchmark-jdk21-results.txt
index cc5acfe9c1670..e200db961f9cd 100644
--- a/sql/core/benchmarks/InMemoryColumnarBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/InMemoryColumnarBenchmark-jdk21-results.txt
@@ -2,11 +2,11 @@
Int In-memory with 1000000 rows
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Int In-Memory scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-columnar deserialization + columnar-to-row 193 253 52 5.2 193.2 1.0X
-row-based deserialization 146 155 9 6.9 145.7 1.3X
+columnar deserialization + columnar-to-row 177 222 65 5.6 177.5 1.0X
+row-based deserialization 129 164 55 7.7 129.5 1.4X
diff --git a/sql/core/benchmarks/InMemoryColumnarBenchmark-results.txt b/sql/core/benchmarks/InMemoryColumnarBenchmark-results.txt
index 45d9390a5602e..51ac715059fae 100644
--- a/sql/core/benchmarks/InMemoryColumnarBenchmark-results.txt
+++ b/sql/core/benchmarks/InMemoryColumnarBenchmark-results.txt
@@ -2,11 +2,11 @@
Int In-memory with 1000000 rows
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Int In-Memory scan: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-columnar deserialization + columnar-to-row 179 220 36 5.6 178.7 1.0X
-row-based deserialization 171 219 70 5.9 170.5 1.0X
+columnar deserialization + columnar-to-row 222 257 41 4.5 222.3 1.0X
+row-based deserialization 140 178 63 7.2 139.8 1.6X
diff --git a/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-jdk21-results.txt b/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-jdk21-results.txt
index 9ab15d2804ac9..f86a35823fc47 100644
--- a/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-jdk21-results.txt
@@ -1,8 +1,8 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dynamic insert table benchmark, totalRows = 200000: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------
-one partition column, 100 partitions 7569 7811 343 0.0 37844.8 1.0X
-two partition columns, 500 partitions 21079 21237 223 0.0 105396.1 0.4X
-three partition columns, 2000 partitions 58077 58838 1077 0.0 290383.9 0.1X
+one partition column, 100 partitions 7661 7709 67 0.0 38305.2 1.0X
+two partition columns, 500 partitions 19979 20122 202 0.0 99894.4 0.4X
+three partition columns, 2000 partitions 56004 56084 113 0.0 280021.2 0.1X
diff --git a/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-results.txt b/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-results.txt
index 9168ce1502a16..e5cbfddc48482 100644
--- a/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-results.txt
+++ b/sql/core/benchmarks/InsertTableWithDynamicPartitionsBenchmark-results.txt
@@ -1,8 +1,8 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
dynamic insert table benchmark, totalRows = 200000: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------
-one partition column, 100 partitions 7507 7533 37 0.0 37536.8 1.0X
-two partition columns, 500 partitions 20204 20330 178 0.0 101021.9 0.4X
-three partition columns, 2000 partitions 54668 55077 578 0.0 273341.1 0.1X
+one partition column, 100 partitions 7780 7799 26 0.0 38901.1 1.0X
+two partition columns, 500 partitions 20050 20197 207 0.0 100252.3 0.4X
+three partition columns, 2000 partitions 55234 55365 186 0.0 276167.7 0.1X
diff --git a/sql/core/benchmarks/IntervalBenchmark-jdk21-results.txt b/sql/core/benchmarks/IntervalBenchmark-jdk21-results.txt
index 895b83b4c0e5e..5096583abec42 100644
--- a/sql/core/benchmarks/IntervalBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/IntervalBenchmark-jdk21-results.txt
@@ -1,40 +1,40 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast strings to intervals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-prepare string w/ interval 423 439 15 2.4 423.2 1.0X
-prepare string w/o interval 384 393 9 2.6 383.6 1.1X
-1 units w/ interval 319 325 7 3.1 319.0 1.3X
-1 units w/o interval 348 351 3 2.9 348.4 1.2X
-2 units w/ interval 547 558 12 1.8 546.7 0.8X
-2 units w/o interval 530 549 18 1.9 529.8 0.8X
-3 units w/ interval 1074 1082 11 0.9 1074.1 0.4X
-3 units w/o interval 1061 1077 18 0.9 1061.5 0.4X
-4 units w/ interval 1208 1222 13 0.8 1208.0 0.4X
-4 units w/o interval 1216 1225 15 0.8 1216.4 0.3X
-5 units w/ interval 1340 1345 4 0.7 1339.9 0.3X
-5 units w/o interval 1333 1340 7 0.8 1332.9 0.3X
-6 units w/ interval 1481 1502 29 0.7 1481.4 0.3X
-6 units w/o interval 1513 1517 3 0.7 1513.4 0.3X
-7 units w/ interval 1835 1842 9 0.5 1834.7 0.2X
-7 units w/o interval 1830 1840 9 0.5 1829.8 0.2X
-8 units w/ interval 1931 1939 7 0.5 1931.2 0.2X
-8 units w/o interval 1920 1924 3 0.5 1920.4 0.2X
-9 units w/ interval 2051 2055 4 0.5 2050.7 0.2X
-9 units w/o interval 2061 2064 4 0.5 2060.6 0.2X
-10 units w/ interval 2346 2363 25 0.4 2346.0 0.2X
-10 units w/o interval 2337 2345 13 0.4 2336.7 0.2X
-11 units w/ interval 2979 2995 28 0.3 2979.0 0.1X
-11 units w/o interval 2966 2979 11 0.3 2966.0 0.1X
+prepare string w/ interval 409 451 37 2.4 409.1 1.0X
+prepare string w/o interval 387 407 18 2.6 387.1 1.1X
+1 units w/ interval 338 341 5 3.0 337.9 1.2X
+1 units w/o interval 358 369 10 2.8 358.0 1.1X
+2 units w/ interval 559 565 6 1.8 559.4 0.7X
+2 units w/o interval 542 555 15 1.8 542.2 0.8X
+3 units w/ interval 1057 1066 9 0.9 1057.4 0.4X
+3 units w/o interval 1047 1052 4 1.0 1047.2 0.4X
+4 units w/ interval 1209 1218 13 0.8 1208.8 0.3X
+4 units w/o interval 1208 1213 8 0.8 1208.1 0.3X
+5 units w/ interval 1315 1317 2 0.8 1315.3 0.3X
+5 units w/o interval 1321 1324 4 0.8 1320.5 0.3X
+6 units w/ interval 1457 1457 0 0.7 1457.0 0.3X
+6 units w/o interval 1452 1457 4 0.7 1451.7 0.3X
+7 units w/ interval 1816 1821 5 0.6 1815.6 0.2X
+7 units w/o interval 1836 1836 0 0.5 1835.8 0.2X
+8 units w/ interval 1902 1907 4 0.5 1902.3 0.2X
+8 units w/o interval 1900 1901 1 0.5 1899.6 0.2X
+9 units w/ interval 2046 2055 13 0.5 2045.8 0.2X
+9 units w/o interval 2061 2062 2 0.5 2060.7 0.2X
+10 units w/ interval 2331 2338 8 0.4 2330.9 0.2X
+10 units w/o interval 2325 2326 1 0.4 2325.0 0.2X
+11 units w/ interval 2507 2516 8 0.4 2507.4 0.2X
+11 units w/o interval 2508 2511 5 0.4 2507.8 0.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
make_interval(): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-prepare make_interval() 328 337 7 3.0 328.4 1.0X
-make_interval(0, 1, 2, 3, 4, 5, 50.123456) 44 45 1 22.7 44.0 7.5X
-make_interval(*, *, 2, 3, 4, 5, 50.123456) 52 62 12 19.2 52.1 6.3X
-make_interval(0, 1, *, *, 4, 5, 50.123456) 56 58 3 17.9 56.0 5.9X
-make_interval(0, 1, 2, 3, *, *, *) 319 321 2 3.1 318.8 1.0X
-make_interval(*, *, *, *, *, *, *) 341 343 4 2.9 340.7 1.0X
+prepare make_interval() 328 329 1 3.0 328.1 1.0X
+make_interval(0, 1, 2, 3, 4, 5, 50.123456) 48 51 3 20.8 48.1 6.8X
+make_interval(*, *, 2, 3, 4, 5, 50.123456) 53 58 7 18.9 53.0 6.2X
+make_interval(0, 1, *, *, 4, 5, 50.123456) 57 57 1 17.6 56.8 5.8X
+make_interval(0, 1, 2, 3, *, *, *) 322 323 1 3.1 321.8 1.0X
+make_interval(*, *, *, *, *, *, *) 332 334 2 3.0 332.2 1.0X
diff --git a/sql/core/benchmarks/IntervalBenchmark-results.txt b/sql/core/benchmarks/IntervalBenchmark-results.txt
index c0a7962c2dc5f..fed39f6a291d2 100644
--- a/sql/core/benchmarks/IntervalBenchmark-results.txt
+++ b/sql/core/benchmarks/IntervalBenchmark-results.txt
@@ -1,40 +1,40 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
cast strings to intervals: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-prepare string w/ interval 395 404 10 2.5 395.1 1.0X
-prepare string w/o interval 368 378 16 2.7 367.6 1.1X
-1 units w/ interval 360 363 3 2.8 359.6 1.1X
-1 units w/o interval 346 352 9 2.9 345.7 1.1X
-2 units w/ interval 508 510 2 2.0 508.1 0.8X
-2 units w/o interval 490 494 5 2.0 490.3 0.8X
-3 units w/ interval 1127 1129 2 0.9 1126.9 0.4X
-3 units w/o interval 1113 1124 20 0.9 1112.9 0.4X
-4 units w/ interval 1265 1283 17 0.8 1265.0 0.3X
-4 units w/o interval 1248 1253 9 0.8 1247.7 0.3X
-5 units w/ interval 1388 1390 1 0.7 1388.5 0.3X
-5 units w/o interval 1379 1382 4 0.7 1379.2 0.3X
-6 units w/ interval 1530 1533 2 0.7 1530.2 0.3X
-6 units w/o interval 1510 1513 6 0.7 1509.6 0.3X
-7 units w/ interval 1866 1877 14 0.5 1866.2 0.2X
-7 units w/o interval 1841 1845 6 0.5 1840.7 0.2X
-8 units w/ interval 2068 2080 14 0.5 2068.1 0.2X
-8 units w/o interval 2062 2066 3 0.5 2061.9 0.2X
-9 units w/ interval 2642 2650 13 0.4 2641.6 0.1X
-9 units w/o interval 2626 2634 8 0.4 2625.9 0.2X
-10 units w/ interval 2817 2832 17 0.4 2817.3 0.1X
-10 units w/o interval 2775 2779 5 0.4 2774.9 0.1X
-11 units w/ interval 3096 3100 6 0.3 3095.8 0.1X
-11 units w/o interval 3080 3084 4 0.3 3080.1 0.1X
+prepare string w/ interval 403 419 13 2.5 403.2 1.0X
+prepare string w/o interval 389 390 1 2.6 388.8 1.0X
+1 units w/ interval 362 366 5 2.8 362.2 1.1X
+1 units w/o interval 363 370 6 2.8 362.8 1.1X
+2 units w/ interval 513 520 6 1.9 513.2 0.8X
+2 units w/o interval 499 503 3 2.0 499.3 0.8X
+3 units w/ interval 1135 1136 1 0.9 1135.1 0.4X
+3 units w/o interval 1125 1126 2 0.9 1124.9 0.4X
+4 units w/ interval 1226 1238 16 0.8 1226.2 0.3X
+4 units w/o interval 1233 1238 8 0.8 1233.2 0.3X
+5 units w/ interval 1384 1389 7 0.7 1383.7 0.3X
+5 units w/o interval 1366 1368 1 0.7 1366.2 0.3X
+6 units w/ interval 1547 1550 2 0.6 1547.4 0.3X
+6 units w/o interval 1526 1528 2 0.7 1526.4 0.3X
+7 units w/ interval 1858 1863 5 0.5 1858.5 0.2X
+7 units w/o interval 1853 1856 3 0.5 1853.3 0.2X
+8 units w/ interval 2063 2083 23 0.5 2062.7 0.2X
+8 units w/o interval 2049 2055 7 0.5 2048.5 0.2X
+9 units w/ interval 2599 2609 13 0.4 2599.2 0.2X
+9 units w/o interval 2586 2588 2 0.4 2585.9 0.2X
+10 units w/ interval 2811 2817 6 0.4 2811.4 0.1X
+10 units w/o interval 2788 2791 5 0.4 2788.4 0.1X
+11 units w/ interval 3070 3074 4 0.3 3069.9 0.1X
+11 units w/o interval 3056 3060 4 0.3 3056.3 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
make_interval(): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-prepare make_interval() 344 348 4 2.9 343.8 1.0X
-make_interval(0, 1, 2, 3, 4, 5, 50.123456) 40 42 2 24.7 40.5 8.5X
-make_interval(*, *, 2, 3, 4, 5, 50.123456) 50 54 4 19.8 50.4 6.8X
-make_interval(0, 1, *, *, 4, 5, 50.123456) 55 59 3 18.1 55.1 6.2X
-make_interval(0, 1, 2, 3, *, *, *) 329 336 6 3.0 329.4 1.0X
-make_interval(*, *, *, *, *, *, *) 337 339 2 3.0 336.9 1.0X
+prepare make_interval() 350 352 2 2.9 349.8 1.0X
+make_interval(0, 1, 2, 3, 4, 5, 50.123456) 47 51 6 21.5 46.6 7.5X
+make_interval(*, *, 2, 3, 4, 5, 50.123456) 55 58 4 18.0 55.5 6.3X
+make_interval(0, 1, *, *, 4, 5, 50.123456) 56 58 2 17.9 55.9 6.3X
+make_interval(0, 1, 2, 3, *, *, *) 336 338 3 3.0 335.8 1.0X
+make_interval(*, *, *, *, *, *, *) 342 343 1 2.9 342.1 1.0X
diff --git a/sql/core/benchmarks/JoinBenchmark-jdk21-results.txt b/sql/core/benchmarks/JoinBenchmark-jdk21-results.txt
index cff5e95c7b36b..cc31554ecdfbf 100644
--- a/sql/core/benchmarks/JoinBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/JoinBenchmark-jdk21-results.txt
@@ -2,81 +2,81 @@
Join Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w long wholestage off 2249 2276 38 9.3 107.2 1.0X
-Join w long wholestage on 1050 1088 41 20.0 50.1 2.1X
+Join w long wholestage off 2144 2152 11 9.8 102.2 1.0X
+Join w long wholestage on 913 938 19 23.0 43.5 2.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w long duplicated: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w long duplicated wholestage off 2043 2046 4 10.3 97.4 1.0X
-Join w long duplicated wholestage on 902 921 18 23.3 43.0 2.3X
+Join w long duplicated wholestage off 2025 2029 6 10.4 96.6 1.0X
+Join w long duplicated wholestage on 947 997 28 22.1 45.2 2.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w 2 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w 2 ints wholestage off 107986 107997 15 0.2 5149.2 1.0X
-Join w 2 ints wholestage on 106359 106444 62 0.2 5071.6 1.0X
+Join w 2 ints wholestage off 108340 108384 62 0.2 5166.1 1.0X
+Join w 2 ints wholestage on 106411 106556 130 0.2 5074.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w 2 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w 2 longs wholestage off 3719 3858 196 5.6 177.4 1.0X
-Join w 2 longs wholestage on 2415 2498 54 8.7 115.2 1.5X
+Join w 2 longs wholestage off 3530 3550 28 5.9 168.3 1.0X
+Join w 2 longs wholestage on 1968 1989 14 10.7 93.8 1.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w 2 longs duplicated: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w 2 longs duplicated wholestage off 8503 8531 39 2.5 405.5 1.0X
-Join w 2 longs duplicated wholestage on 5581 5695 74 3.8 266.1 1.5X
+Join w 2 longs duplicated wholestage off 8952 9029 109 2.3 426.8 1.0X
+Join w 2 longs duplicated wholestage on 5694 5767 67 3.7 271.5 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
outer join w long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-outer join w long wholestage off 1770 1812 59 11.8 84.4 1.0X
-outer join w long wholestage on 1057 1096 32 19.8 50.4 1.7X
+outer join w long wholestage off 1574 1576 3 13.3 75.1 1.0X
+outer join w long wholestage on 934 993 102 22.4 44.6 1.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
semi join w long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-semi join w long wholestage off 1064 1068 6 19.7 50.7 1.0X
-semi join w long wholestage on 553 566 12 37.9 26.4 1.9X
+semi join w long wholestage off 1060 1063 4 19.8 50.6 1.0X
+semi join w long wholestage on 555 578 15 37.8 26.5 1.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sort merge join: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-sort merge join wholestage off 535 541 9 3.9 254.9 1.0X
-sort merge join wholestage on 470 482 14 4.5 224.0 1.1X
+sort merge join wholestage off 507 514 9 4.1 241.8 1.0X
+sort merge join wholestage on 461 468 6 4.5 219.8 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sort merge join with duplicates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-sort merge join with duplicates wholestage off 1056 1057 1 2.0 503.7 1.0X
-sort merge join with duplicates wholestage on 955 966 7 2.2 455.6 1.1X
+sort merge join with duplicates wholestage off 1013 1015 2 2.1 483.0 1.0X
+sort merge join with duplicates wholestage on 921 931 10 2.3 439.0 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
shuffle hash join: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-shuffle hash join wholestage off 536 554 25 7.8 127.9 1.0X
-shuffle hash join wholestage on 416 433 14 10.1 99.1 1.3X
+shuffle hash join wholestage off 516 528 17 8.1 123.1 1.0X
+shuffle hash join wholestage on 370 391 17 11.3 88.3 1.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
broadcast nested loop join: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-broadcast nested loop join wholestage off 27126 27236 155 0.8 1293.5 1.0X
-broadcast nested loop join wholestage on 21319 21567 223 1.0 1016.6 1.3X
+broadcast nested loop join wholestage off 25481 25537 80 0.8 1215.0 1.0X
+broadcast nested loop join wholestage on 17573 17808 226 1.2 838.0 1.4X
diff --git a/sql/core/benchmarks/JoinBenchmark-results.txt b/sql/core/benchmarks/JoinBenchmark-results.txt
index 9d546eff9eb1d..71fad9100fe82 100644
--- a/sql/core/benchmarks/JoinBenchmark-results.txt
+++ b/sql/core/benchmarks/JoinBenchmark-results.txt
@@ -2,81 +2,81 @@
Join Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w long wholestage off 2042 2057 21 10.3 97.4 1.0X
-Join w long wholestage on 955 1006 70 22.0 45.5 2.1X
+Join w long wholestage off 2023 2060 52 10.4 96.5 1.0X
+Join w long wholestage on 1018 1066 29 20.6 48.5 2.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w long duplicated: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w long duplicated wholestage off 1989 2101 159 10.5 94.8 1.0X
-Join w long duplicated wholestage on 905 925 22 23.2 43.1 2.2X
+Join w long duplicated wholestage off 1960 1982 32 10.7 93.4 1.0X
+Join w long duplicated wholestage on 901 928 31 23.3 43.0 2.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w 2 ints: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w 2 ints wholestage off 112857 112868 15 0.2 5381.5 1.0X
-Join w 2 ints wholestage on 111346 111409 65 0.2 5309.4 1.0X
+Join w 2 ints wholestage off 112829 112886 81 0.2 5380.1 1.0X
+Join w 2 ints wholestage on 111531 111580 43 0.2 5318.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w 2 longs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w 2 longs wholestage off 3248 3257 13 6.5 154.9 1.0X
-Join w 2 longs wholestage on 2023 2051 36 10.4 96.5 1.6X
+Join w 2 longs wholestage off 3306 3312 8 6.3 157.7 1.0X
+Join w 2 longs wholestage on 2188 2225 37 9.6 104.3 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Join w 2 longs duplicated: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Join w 2 longs duplicated wholestage off 8464 8469 6 2.5 403.6 1.0X
-Join w 2 longs duplicated wholestage on 5481 5504 17 3.8 261.4 1.5X
+Join w 2 longs duplicated wholestage off 8196 8221 35 2.6 390.8 1.0X
+Join w 2 longs duplicated wholestage on 5451 5509 35 3.8 259.9 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
outer join w long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-outer join w long wholestage off 1590 1598 11 13.2 75.8 1.0X
-outer join w long wholestage on 942 947 4 22.3 44.9 1.7X
+outer join w long wholestage off 1710 1712 3 12.3 81.5 1.0X
+outer join w long wholestage on 1036 1045 10 20.2 49.4 1.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
semi join w long: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-semi join w long wholestage off 1074 1076 3 19.5 51.2 1.0X
-semi join w long wholestage on 529 559 32 39.6 25.2 2.0X
+semi join w long wholestage off 1077 1116 56 19.5 51.4 1.0X
+semi join w long wholestage on 526 548 36 39.9 25.1 2.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sort merge join: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-sort merge join wholestage off 542 543 2 3.9 258.5 1.0X
-sort merge join wholestage on 467 480 16 4.5 222.8 1.2X
+sort merge join wholestage off 533 538 7 3.9 254.1 1.0X
+sort merge join wholestage on 460 470 6 4.6 219.2 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sort merge join with duplicates: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------
-sort merge join with duplicates wholestage off 1074 1076 3 2.0 512.1 1.0X
-sort merge join with duplicates wholestage on 957 966 6 2.2 456.4 1.1X
+sort merge join with duplicates wholestage off 1052 1054 3 2.0 501.5 1.0X
+sort merge join with duplicates wholestage on 944 950 6 2.2 450.1 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
shuffle hash join: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-shuffle hash join wholestage off 484 486 3 8.7 115.4 1.0X
-shuffle hash join wholestage on 366 373 8 11.5 87.1 1.3X
+shuffle hash join wholestage off 483 487 6 8.7 115.1 1.0X
+shuffle hash join wholestage on 367 378 9 11.4 87.5 1.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
broadcast nested loop join: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-broadcast nested loop join wholestage off 26051 26090 55 0.8 1242.2 1.0X
-broadcast nested loop join wholestage on 17018 17068 32 1.2 811.5 1.5X
+broadcast nested loop join wholestage off 27392 27733 482 0.8 1306.2 1.0X
+broadcast nested loop join wholestage on 19262 19470 214 1.1 918.5 1.4X
diff --git a/sql/core/benchmarks/JsonBenchmark-jdk21-results.txt b/sql/core/benchmarks/JsonBenchmark-jdk21-results.txt
index 3a126b6f0da15..8222b122c0d5b 100644
--- a/sql/core/benchmarks/JsonBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/JsonBenchmark-jdk21-results.txt
@@ -3,128 +3,128 @@ Benchmark for performance of JSON parsing
================================================================================================
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON schema inferring: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 2253 2358 117 2.2 450.6 1.0X
-UTF-8 is set 4846 4861 13 1.0 969.2 0.5X
+No encoding 2449 2522 100 2.0 489.8 1.0X
+UTF-8 is set 4926 4949 35 1.0 985.2 0.5X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
count a short column: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 2105 2123 18 2.4 421.0 1.0X
-UTF-8 is set 4657 4664 10 1.1 931.3 0.5X
+No encoding 1976 2030 55 2.5 395.3 1.0X
+UTF-8 is set 4585 4593 10 1.1 917.0 0.4X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
count a wide column: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 4551 4598 77 0.2 4550.7 1.0X
-UTF-8 is set 4372 4379 8 0.2 4372.2 1.0X
+No encoding 4544 4562 18 0.2 4543.6 1.0X
+UTF-8 is set 4417 4433 14 0.2 4417.2 1.0X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
select wide row: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 9258 9360 152 0.0 185154.2 1.0X
-UTF-8 is set 10320 10346 23 0.0 206392.2 0.9X
+No encoding 10431 10576 227 0.0 208628.1 1.0X
+UTF-8 is set 11244 11277 30 0.0 224872.2 0.9X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select a subset of 10 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Select 10 columns 1712 1713 1 0.6 1712.4 1.0X
-Select 1 column 1291 1298 10 0.8 1290.9 1.3X
+Select 10 columns 1735 1736 2 0.6 1734.5 1.0X
+Select 1 column 1146 1148 2 0.9 1146.2 1.5X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
creation of JSON parser per line: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Short column without encoding 647 649 4 1.5 647.0 1.0X
-Short column with UTF-8 1169 1180 10 0.9 1169.2 0.6X
-Wide column without encoding 5268 5293 27 0.2 5267.8 0.1X
-Wide column with UTF-8 6536 6557 20 0.2 6535.9 0.1X
+Short column without encoding 601 603 3 1.7 600.7 1.0X
+Short column with UTF-8 1130 1132 2 0.9 1129.9 0.5X
+Wide column without encoding 5232 5270 41 0.2 5231.8 0.1X
+Wide column with UTF-8 8895 8907 10 0.1 8895.4 0.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON functions: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Text read 57 65 7 17.5 57.2 1.0X
-from_json 1080 1085 7 0.9 1079.9 0.1X
-json_tuple 1010 1012 2 1.0 1010.4 0.1X
-get_json_object wholestage off 1033 1038 4 1.0 1033.4 0.1X
-get_json_object wholestage on 951 952 2 1.1 950.9 0.1X
+Text read 59 65 5 16.9 59.1 1.0X
+from_json 1090 1103 14 0.9 1090.2 0.1X
+json_tuple 1044 1053 8 1.0 1043.6 0.1X
+get_json_object wholestage off 1052 1059 6 1.0 1052.4 0.1X
+get_json_object wholestage on 983 998 13 1.0 983.1 0.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Dataset of json strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Text read 259 262 3 19.3 51.8 1.0X
-schema inferring 1918 1934 15 2.6 383.5 0.1X
-parsing 2804 2815 11 1.8 560.8 0.1X
+Text read 234 236 2 21.3 46.8 1.0X
+schema inferring 1793 1797 5 2.8 358.6 0.1X
+parsing 2582 2583 1 1.9 516.4 0.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Json files in the per-line mode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Text read 583 592 8 8.6 116.7 1.0X
-Schema inferring 2412 2414 2 2.1 482.4 0.2X
-Parsing without charset 2962 2970 9 1.7 592.3 0.2X
-Parsing with UTF-8 5458 5462 5 0.9 1091.7 0.1X
+Text read 593 596 3 8.4 118.5 1.0X
+Schema inferring 2369 2370 1 2.1 473.7 0.3X
+Parsing without charset 2771 2776 6 1.8 554.3 0.2X
+Parsing with UTF-8 5392 5400 9 0.9 1078.4 0.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Create a dataset of timestamps 105 109 5 9.5 105.2 1.0X
-to_json(timestamp) 550 551 2 1.8 549.9 0.2X
-write timestamps to files 582 586 3 1.7 582.4 0.2X
-Create a dataset of dates 113 114 2 8.9 112.8 0.9X
-to_json(date) 417 419 3 2.4 416.8 0.3X
-write dates to files 390 392 2 2.6 390.2 0.3X
+Create a dataset of timestamps 105 107 2 9.5 105.2 1.0X
+to_json(timestamp) 541 546 8 1.8 540.6 0.2X
+write timestamps to files 572 574 3 1.7 571.9 0.2X
+Create a dataset of dates 110 113 3 9.1 110.2 1.0X
+to_json(date) 385 386 1 2.6 384.8 0.3X
+write dates to files 414 417 3 2.4 413.6 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-read timestamp text from files 150 154 3 6.6 150.4 1.0X
-read timestamps from files 1131 1149 19 0.9 1130.9 0.1X
-infer timestamps from files 2155 2156 0 0.5 2155.3 0.1X
-read date text from files 138 143 4 7.2 138.3 1.1X
-read date from files 718 721 5 1.4 718.1 0.2X
-timestamp strings 142 143 1 7.0 142.4 1.1X
-parse timestamps from Dataset[String] 1270 1272 3 0.8 1269.8 0.1X
-infer timestamps from Dataset[String] 2224 2227 3 0.4 2224.4 0.1X
-date strings 195 196 1 5.1 195.3 0.8X
-parse dates from Dataset[String] 972 973 1 1.0 972.4 0.2X
-from_json(timestamp) 1739 1742 3 0.6 1739.4 0.1X
-from_json(date) 1400 1401 1 0.7 1400.2 0.1X
-infer error timestamps from Dataset[String] with default format 1433 1437 4 0.7 1433.0 0.1X
-infer error timestamps from Dataset[String] with user-provided format 1439 1442 3 0.7 1439.0 0.1X
-infer error timestamps from Dataset[String] with legacy format 1475 1480 4 0.7 1475.3 0.1X
+read timestamp text from files 158 160 3 6.3 157.5 1.0X
+read timestamps from files 1078 1084 5 0.9 1078.0 0.1X
+infer timestamps from files 2034 2041 11 0.5 2034.1 0.1X
+read date text from files 146 153 6 6.8 146.3 1.1X
+read date from files 674 675 2 1.5 673.7 0.2X
+timestamp strings 136 138 2 7.4 135.6 1.2X
+parse timestamps from Dataset[String] 1255 1260 6 0.8 1254.7 0.1X
+infer timestamps from Dataset[String] 2203 2210 6 0.5 2203.3 0.1X
+date strings 202 202 0 5.0 201.8 0.8X
+parse dates from Dataset[String] 955 959 5 1.0 954.8 0.2X
+from_json(timestamp) 1731 1736 6 0.6 1731.2 0.1X
+from_json(date) 1438 1440 3 0.7 1437.9 0.1X
+infer error timestamps from Dataset[String] with default format 1352 1358 4 0.7 1352.5 0.1X
+infer error timestamps from Dataset[String] with user-provided format 1352 1352 0 0.7 1351.6 0.1X
+infer error timestamps from Dataset[String] with legacy format 1378 1381 4 0.7 1377.7 0.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Filters pushdown: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-w/o filters 6068 6076 11 0.0 60681.7 1.0X
-pushdown disabled 5926 5934 10 0.0 59263.4 1.0X
-w/ filters 650 654 4 0.2 6496.2 9.3X
+w/o filters 6114 6115 1 0.0 61142.8 1.0X
+pushdown disabled 6017 6030 12 0.0 60165.6 1.0X
+w/ filters 712 721 7 0.1 7124.1 8.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Partial JSON results: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-parse invalid JSON 2249 2258 14 0.0 224874.5 1.0X
+parse invalid JSON 2534 2540 7 0.0 253448.0 1.0X
diff --git a/sql/core/benchmarks/JsonBenchmark-results.txt b/sql/core/benchmarks/JsonBenchmark-results.txt
index f3115219608e8..43f7ce63768a6 100644
--- a/sql/core/benchmarks/JsonBenchmark-results.txt
+++ b/sql/core/benchmarks/JsonBenchmark-results.txt
@@ -3,128 +3,128 @@ Benchmark for performance of JSON parsing
================================================================================================
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON schema inferring: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 2310 2321 12 2.2 461.9 1.0X
-UTF-8 is set 4784 4795 10 1.0 956.9 0.5X
+No encoding 2179 2239 75 2.3 435.9 1.0X
+UTF-8 is set 5291 5328 33 0.9 1058.2 0.4X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
count a short column: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 2215 2246 30 2.3 443.0 1.0X
-UTF-8 is set 4718 4724 7 1.1 943.5 0.5X
+No encoding 2029 2079 72 2.5 405.8 1.0X
+UTF-8 is set 4499 4501 2 1.1 899.8 0.5X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
count a wide column: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 4269 4376 151 0.2 4268.9 1.0X
-UTF-8 is set 4447 4459 15 0.2 4446.8 1.0X
+No encoding 4605 4651 40 0.2 4604.9 1.0X
+UTF-8 is set 4661 4685 24 0.2 4660.5 1.0X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
select wide row: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-No encoding 9025 9101 70 0.0 180505.7 1.0X
-UTF-8 is set 9983 10004 24 0.0 199666.6 0.9X
+No encoding 8833 8999 215 0.0 176664.5 1.0X
+UTF-8 is set 9740 9745 5 0.0 194807.7 0.9X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Select a subset of 10 columns: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Select 10 columns 1585 1588 5 0.6 1584.6 1.0X
-Select 1 column 1253 1256 4 0.8 1253.2 1.3X
+Select 10 columns 1487 1497 12 0.7 1487.0 1.0X
+Select 1 column 1083 1088 4 0.9 1083.4 1.4X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
creation of JSON parser per line: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Short column without encoding 644 646 2 1.6 644.2 1.0X
-Short column with UTF-8 1163 1174 18 0.9 1162.6 0.6X
-Wide column without encoding 5178 5191 12 0.2 5177.7 0.1X
-Wide column with UTF-8 5983 5987 4 0.2 5982.7 0.1X
+Short column without encoding 600 607 7 1.7 600.1 1.0X
+Short column with UTF-8 1073 1081 9 0.9 1072.8 0.6X
+Wide column without encoding 5205 5216 15 0.2 5205.5 0.1X
+Wide column with UTF-8 6720 6730 10 0.1 6719.9 0.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON functions: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Text read 56 59 3 17.9 55.8 1.0X
-from_json 1039 1057 28 1.0 1038.8 0.1X
-json_tuple 1036 1040 5 1.0 1035.5 0.1X
-get_json_object wholestage off 1056 1061 8 0.9 1055.9 0.1X
-get_json_object wholestage on 993 999 6 1.0 992.7 0.1X
+Text read 64 71 6 15.6 64.1 1.0X
+from_json 1058 1061 2 0.9 1058.5 0.1X
+json_tuple 1004 1006 3 1.0 1003.6 0.1X
+get_json_object wholestage off 1036 1044 7 1.0 1036.3 0.1X
+get_json_object wholestage on 953 956 3 1.0 953.0 0.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Dataset of json strings: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Text read 260 263 4 19.2 52.0 1.0X
-schema inferring 1765 1768 2 2.8 353.0 0.1X
-parsing 2756 2775 18 1.8 551.2 0.1X
+Text read 249 253 6 20.0 49.9 1.0X
+schema inferring 1822 1831 15 2.7 364.4 0.1X
+parsing 2444 2456 10 2.0 488.8 0.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Json files in the per-line mode: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Text read 580 583 2 8.6 116.1 1.0X
-Schema inferring 2349 2355 8 2.1 469.8 0.2X
-Parsing without charset 2935 2940 8 1.7 587.0 0.2X
-Parsing with UTF-8 5463 5504 69 0.9 1092.6 0.1X
+Text read 602 603 1 8.3 120.4 1.0X
+Schema inferring 2349 2352 3 2.1 469.7 0.3X
+Parsing without charset 2701 2709 6 1.9 540.2 0.2X
+Parsing with UTF-8 5177 5184 7 1.0 1035.3 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Create a dataset of timestamps 102 106 6 9.8 101.9 1.0X
-to_json(timestamp) 634 637 3 1.6 634.4 0.2X
-write timestamps to files 676 678 2 1.5 676.2 0.2X
-Create a dataset of dates 114 117 2 8.7 114.4 0.9X
-to_json(date) 439 440 1 2.3 439.1 0.2X
-write dates to files 435 438 2 2.3 435.2 0.2X
+Create a dataset of timestamps 110 113 3 9.1 110.3 1.0X
+to_json(timestamp) 633 637 6 1.6 632.6 0.2X
+write timestamps to files 668 672 4 1.5 667.9 0.2X
+Create a dataset of dates 115 117 3 8.7 115.4 1.0X
+to_json(date) 437 438 0 2.3 437.2 0.3X
+write dates to files 424 428 3 2.4 424.4 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read dates and timestamps: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-read timestamp text from files 151 154 2 6.6 151.5 1.0X
-read timestamps from files 1049 1051 3 1.0 1048.9 0.1X
-infer timestamps from files 1959 1967 10 0.5 1958.7 0.1X
-read date text from files 136 141 5 7.4 135.9 1.1X
-read date from files 703 713 10 1.4 702.7 0.2X
-timestamp strings 141 143 2 7.1 141.1 1.1X
-parse timestamps from Dataset[String] 1191 1195 7 0.8 1190.9 0.1X
-infer timestamps from Dataset[String] 2065 2071 9 0.5 2065.3 0.1X
-date strings 203 205 2 4.9 202.6 0.7X
-parse dates from Dataset[String] 967 970 4 1.0 967.0 0.2X
-from_json(timestamp) 1629 1632 2 0.6 1628.9 0.1X
-from_json(date) 1371 1396 41 0.7 1371.0 0.1X
-infer error timestamps from Dataset[String] with default format 1400 1404 4 0.7 1400.1 0.1X
-infer error timestamps from Dataset[String] with user-provided format 1401 1405 5 0.7 1400.8 0.1X
-infer error timestamps from Dataset[String] with legacy format 1429 1431 2 0.7 1429.0 0.1X
+read timestamp text from files 152 158 6 6.6 152.2 1.0X
+read timestamps from files 983 984 1 1.0 982.9 0.2X
+infer timestamps from files 1857 1866 8 0.5 1857.2 0.1X
+read date text from files 147 153 9 6.8 146.5 1.0X
+read date from files 671 674 4 1.5 671.0 0.2X
+timestamp strings 135 138 2 7.4 135.0 1.1X
+parse timestamps from Dataset[String] 1138 1140 3 0.9 1137.8 0.1X
+infer timestamps from Dataset[String] 1985 1992 6 0.5 1985.4 0.1X
+date strings 229 230 1 4.4 228.8 0.7X
+parse dates from Dataset[String] 916 917 1 1.1 915.7 0.2X
+from_json(timestamp) 1644 1648 7 0.6 1643.7 0.1X
+from_json(date) 1390 1400 9 0.7 1390.4 0.1X
+infer error timestamps from Dataset[String] with default format 1317 1322 9 0.8 1317.1 0.1X
+infer error timestamps from Dataset[String] with user-provided format 1316 1330 12 0.8 1316.4 0.1X
+infer error timestamps from Dataset[String] with legacy format 1341 1344 3 0.7 1341.2 0.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Filters pushdown: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-w/o filters 6452 6469 19 0.0 64519.3 1.0X
-pushdown disabled 6245 6253 8 0.0 62445.5 1.0X
-w/ filters 556 560 4 0.2 5563.4 11.6X
+w/o filters 5704 5706 2 0.0 57043.0 1.0X
+pushdown disabled 5604 5622 24 0.0 56042.1 1.0X
+w/ filters 643 654 11 0.2 6430.2 8.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Partial JSON results: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-parse invalid JSON 2255 2376 205 0.0 225510.6 1.0X
+parse invalid JSON 2332 2422 150 0.0 233209.5 1.0X
diff --git a/sql/core/benchmarks/LargeRowBenchmark-jdk21-results.txt b/sql/core/benchmarks/LargeRowBenchmark-jdk21-results.txt
index cbd78a086ea36..a34a68164c754 100644
--- a/sql/core/benchmarks/LargeRowBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/LargeRowBenchmark-jdk21-results.txt
@@ -2,25 +2,25 @@
Large Row Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
#rows: 100, #cols: 10, cell: 1.3 MB: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-built-in UPPER 5912 6241 466 0.0 59115266.3 1.0X
-udf UPPER 4116 4134 25 0.0 41162058.1 1.4X
+built-in UPPER 5851 6220 521 0.0 58513209.6 1.0X
+udf UPPER 5127 5162 50 0.0 51266519.2 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
#rows: 1, #cols: 1, cell: 300.0 MB: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-built-in UPPER 1339 1346 10 0.0 1339197183.0 1.0X
-udf UPPER 932 969 50 0.0 931637076.0 1.4X
+built-in UPPER 1315 1322 9 0.0 1315306640.0 1.0X
+udf UPPER 1001 1004 3 0.0 1001420387.0 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
#rows: 1, #cols: 200, cell: 1.0 MB: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-built-in UPPER 1116 1137 30 0.0 1115727291.0 1.0X
-udf UPPER 1187 1217 43 0.0 1186838839.0 0.9X
+built-in UPPER 1130 1145 21 0.0 1130109481.0 1.0X
+udf UPPER 1199 1248 70 0.0 1198653800.0 0.9X
diff --git a/sql/core/benchmarks/LargeRowBenchmark-results.txt b/sql/core/benchmarks/LargeRowBenchmark-results.txt
index 8c8eea8b92226..a8dc06172135f 100644
--- a/sql/core/benchmarks/LargeRowBenchmark-results.txt
+++ b/sql/core/benchmarks/LargeRowBenchmark-results.txt
@@ -2,25 +2,25 @@
Large Row Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
#rows: 100, #cols: 10, cell: 1.3 MB: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-built-in UPPER 6896 6962 93 0.0 68960045.7 1.0X
-udf UPPER 4315 4367 74 0.0 43151937.6 1.6X
+built-in UPPER 6774 6793 27 0.0 67735578.9 1.0X
+udf UPPER 4768 4770 2 0.0 47680577.5 1.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
#rows: 1, #cols: 1, cell: 300.0 MB: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-built-in UPPER 1532 1534 4 0.0 1531617745.0 1.0X
-udf UPPER 996 999 3 0.0 995955863.0 1.5X
+built-in UPPER 1520 1530 14 0.0 1520168353.0 1.0X
+udf UPPER 1048 1049 2 0.0 1047675797.0 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
#rows: 1, #cols: 200, cell: 1.0 MB: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-built-in UPPER 1263 1308 63 0.0 1263021540.0 1.0X
-udf UPPER 1366 1438 102 0.0 1365656763.0 0.9X
+built-in UPPER 1250 1267 25 0.0 1249716088.0 1.0X
+udf UPPER 1231 1309 110 0.0 1231441056.0 1.0X
diff --git a/sql/core/benchmarks/MakeDateTimeBenchmark-jdk21-results.txt b/sql/core/benchmarks/MakeDateTimeBenchmark-jdk21-results.txt
index e3a39091e0d88..df4d262091ac8 100644
--- a/sql/core/benchmarks/MakeDateTimeBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/MakeDateTimeBenchmark-jdk21-results.txt
@@ -1,22 +1,22 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
make_date(): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-prepare make_date() 2308 2354 49 43.3 23.1 1.0X
-make_date(2019, 9, 16) 2016 2102 80 49.6 20.2 1.1X
-make_date(*, *, *) 2866 2886 17 34.9 28.7 0.8X
+prepare make_date() 2331 2417 144 42.9 23.3 1.0X
+make_date(2019, 9, 16) 1966 1985 27 50.9 19.7 1.2X
+make_date(*, *, *) 2979 2989 9 33.6 29.8 0.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
make_timestamp(): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-prepare make_timestamp() 333 334 2 3.0 332.6 1.0X
-make_timestamp(2019, 1, 2, 3, 4, 50.123456) 38 45 7 26.3 38.1 8.7X
-make_timestamp(2019, 1, 2, 3, 4, 60.000000) 35 44 9 29.0 34.5 9.6X
-make_timestamp(2019, 12, 31, 23, 59, 60.00) 33 39 4 30.0 33.3 10.0X
-make_timestamp(*, *, *, 3, 4, 50.123456) 144 148 5 7.0 143.8 2.3X
-make_timestamp(*, *, *, *, *, 0) 106 115 8 9.4 106.0 3.1X
-make_timestamp(*, *, *, *, *, 60.0) 141 141 0 7.1 140.6 2.4X
-make_timestamp(2019, 1, 2, *, *, *) 450 454 7 2.2 449.7 0.7X
-make_timestamp(*, *, *, *, *, *) 461 465 3 2.2 461.4 0.7X
+prepare make_timestamp() 331 337 5 3.0 330.6 1.0X
+make_timestamp(2019, 1, 2, 3, 4, 50.123456) 41 42 1 24.6 40.6 8.1X
+make_timestamp(2019, 1, 2, 3, 4, 60.000000) 38 40 3 26.2 38.1 8.7X
+make_timestamp(2019, 12, 31, 23, 59, 60.00) 35 39 5 28.6 35.0 9.5X
+make_timestamp(*, *, *, 3, 4, 50.123456) 171 171 0 5.8 171.1 1.9X
+make_timestamp(*, *, *, *, *, 0) 111 113 3 9.0 110.5 3.0X
+make_timestamp(*, *, *, *, *, 60.0) 139 142 3 7.2 138.7 2.4X
+make_timestamp(2019, 1, 2, *, *, *) 454 455 1 2.2 453.5 0.7X
+make_timestamp(*, *, *, *, *, *) 494 495 1 2.0 494.0 0.7X
diff --git a/sql/core/benchmarks/MakeDateTimeBenchmark-results.txt b/sql/core/benchmarks/MakeDateTimeBenchmark-results.txt
index 6fabd6588ce73..016c678bf9ed6 100644
--- a/sql/core/benchmarks/MakeDateTimeBenchmark-results.txt
+++ b/sql/core/benchmarks/MakeDateTimeBenchmark-results.txt
@@ -1,22 +1,22 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
make_date(): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-prepare make_date() 2197 2236 43 45.5 22.0 1.0X
-make_date(2019, 9, 16) 1756 1858 94 56.9 17.6 1.3X
-make_date(*, *, *) 2969 2971 2 33.7 29.7 0.7X
+prepare make_date() 2215 2250 31 45.1 22.2 1.0X
+make_date(2019, 9, 16) 1908 1968 65 52.4 19.1 1.2X
+make_date(*, *, *) 2978 3021 47 33.6 29.8 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
make_timestamp(): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-prepare make_timestamp() 357 397 57 2.8 356.6 1.0X
-make_timestamp(2019, 1, 2, 3, 4, 50.123456) 45 46 1 22.3 44.9 7.9X
-make_timestamp(2019, 1, 2, 3, 4, 60.000000) 36 39 5 27.6 36.2 9.9X
-make_timestamp(2019, 12, 31, 23, 59, 60.00) 41 42 2 24.6 40.7 8.8X
-make_timestamp(*, *, *, 3, 4, 50.123456) 162 164 2 6.2 161.6 2.2X
-make_timestamp(*, *, *, *, *, 0) 108 115 6 9.3 107.6 3.3X
-make_timestamp(*, *, *, *, *, 60.0) 137 141 4 7.3 136.8 2.6X
-make_timestamp(2019, 1, 2, *, *, *) 482 487 5 2.1 481.9 0.7X
-make_timestamp(*, *, *, *, *, *) 480 485 5 2.1 480.2 0.7X
+prepare make_timestamp() 343 356 15 2.9 343.4 1.0X
+make_timestamp(2019, 1, 2, 3, 4, 50.123456) 40 41 1 25.1 39.8 8.6X
+make_timestamp(2019, 1, 2, 3, 4, 60.000000) 36 39 5 28.1 35.5 9.7X
+make_timestamp(2019, 12, 31, 23, 59, 60.00) 35 38 3 28.7 34.9 9.8X
+make_timestamp(*, *, *, 3, 4, 50.123456) 168 170 3 6.0 168.1 2.0X
+make_timestamp(*, *, *, *, *, 0) 108 109 2 9.3 108.0 3.2X
+make_timestamp(*, *, *, *, *, 60.0) 136 138 4 7.4 135.5 2.5X
+make_timestamp(2019, 1, 2, *, *, *) 438 441 4 2.3 438.4 0.8X
+make_timestamp(*, *, *, *, *, *) 466 468 2 2.1 466.0 0.7X
diff --git a/sql/core/benchmarks/MetadataStructBenchmark-jdk21-results.txt b/sql/core/benchmarks/MetadataStructBenchmark-jdk21-results.txt
index 35bf5113ee895..e07f622fdd53a 100644
--- a/sql/core/benchmarks/MetadataStructBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/MetadataStructBenchmark-jdk21-results.txt
@@ -2,45 +2,45 @@
Metadata Struct Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Vectorized Parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-no metadata columns 629 650 18 7.9 125.8 1.0X
-_metadata.file_path 729 744 12 6.9 145.9 0.9X
-_metadata.file_name 735 745 16 6.8 146.9 0.9X
-_metadata.file_size 657 669 7 7.6 131.3 1.0X
-_metadata.file_block_start 658 668 9 7.6 131.6 1.0X
-_metadata.file_block_length 657 666 8 7.6 131.3 1.0X
-_metadata.file_modification_time 627 655 11 8.0 125.5 1.0X
-_metadata.row_index 710 719 11 7.0 142.0 0.9X
-_metadata 954 976 11 5.2 190.9 0.7X
+no metadata columns 639 659 16 7.8 127.8 1.0X
+_metadata.file_path 735 749 11 6.8 147.1 0.9X
+_metadata.file_name 735 745 9 6.8 147.0 0.9X
+_metadata.file_size 662 673 9 7.6 132.3 1.0X
+_metadata.file_block_start 631 666 12 7.9 126.3 1.0X
+_metadata.file_block_length 661 671 6 7.6 132.3 1.0X
+_metadata.file_modification_time 662 670 6 7.6 132.3 1.0X
+_metadata.row_index 695 715 12 7.2 139.0 0.9X
+_metadata 954 978 11 5.2 190.8 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet-mr: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-no metadata columns 2703 2746 29 1.8 540.7 1.0X
-_metadata.file_path 3467 3505 21 1.4 693.4 0.8X
-_metadata.file_name 3515 3538 15 1.4 703.0 0.8X
-_metadata.file_size 3292 3322 17 1.5 658.5 0.8X
-_metadata.file_block_start 3312 3345 19 1.5 662.3 0.8X
-_metadata.file_block_length 3310 3339 16 1.5 662.0 0.8X
-_metadata.file_modification_time 3305 3355 31 1.5 661.1 0.8X
-_metadata.row_index 3625 3655 18 1.4 725.1 0.7X
-_metadata 4831 4871 27 1.0 966.2 0.6X
+no metadata columns 2758 2792 27 1.8 551.7 1.0X
+_metadata.file_path 3525 3567 22 1.4 705.0 0.8X
+_metadata.file_name 3511 3541 16 1.4 702.2 0.8X
+_metadata.file_size 3358 3391 30 1.5 671.6 0.8X
+_metadata.file_block_start 3363 3387 19 1.5 672.5 0.8X
+_metadata.file_block_length 3359 3386 20 1.5 671.8 0.8X
+_metadata.file_modification_time 3355 3387 20 1.5 671.0 0.8X
+_metadata.row_index 3650 3681 32 1.4 730.0 0.8X
+_metadata 4791 4824 24 1.0 958.2 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-no metadata columns 6623 6680 78 0.8 1324.5 1.0X
-_metadata.file_path 7465 7493 16 0.7 1493.1 0.9X
-_metadata.file_name 7485 7510 23 0.7 1497.0 0.9X
-_metadata.file_size 7311 7335 13 0.7 1462.1 0.9X
-_metadata.file_block_start 7316 7331 9 0.7 1463.3 0.9X
-_metadata.file_block_length 7327 7343 13 0.7 1465.4 0.9X
-_metadata.file_modification_time 7314 7331 11 0.7 1462.7 0.9X
-_metadata 8155 8175 15 0.6 1631.0 0.8X
+no metadata columns 6897 6946 65 0.7 1379.4 1.0X
+_metadata.file_path 7726 7756 14 0.6 1545.3 0.9X
+_metadata.file_name 7734 7793 38 0.6 1546.8 0.9X
+_metadata.file_size 7549 7581 20 0.7 1509.8 0.9X
+_metadata.file_block_start 7546 7602 33 0.7 1509.2 0.9X
+_metadata.file_block_length 7574 7610 24 0.7 1514.8 0.9X
+_metadata.file_modification_time 7561 7600 21 0.7 1512.1 0.9X
+_metadata 8303 8337 18 0.6 1660.5 0.8X
diff --git a/sql/core/benchmarks/MetadataStructBenchmark-results.txt b/sql/core/benchmarks/MetadataStructBenchmark-results.txt
index bc35900fc09a2..f3ea90a400b5c 100644
--- a/sql/core/benchmarks/MetadataStructBenchmark-results.txt
+++ b/sql/core/benchmarks/MetadataStructBenchmark-results.txt
@@ -2,45 +2,45 @@
Metadata Struct Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Vectorized Parquet: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-no metadata columns 634 661 21 7.9 126.9 1.0X
-_metadata.file_path 737 753 9 6.8 147.5 0.9X
-_metadata.file_name 723 741 9 6.9 144.6 0.9X
-_metadata.file_size 673 682 4 7.4 134.7 0.9X
-_metadata.file_block_start 676 680 4 7.4 135.1 0.9X
-_metadata.file_block_length 657 677 6 7.6 131.4 1.0X
-_metadata.file_modification_time 648 670 10 7.7 129.6 1.0X
-_metadata.row_index 718 727 7 7.0 143.7 0.9X
-_metadata 981 1015 15 5.1 196.3 0.6X
+no metadata columns 654 680 29 7.6 130.9 1.0X
+_metadata.file_path 750 765 16 6.7 150.0 0.9X
+_metadata.file_name 747 756 6 6.7 149.4 0.9X
+_metadata.file_size 679 689 6 7.4 135.8 1.0X
+_metadata.file_block_start 682 688 4 7.3 136.4 1.0X
+_metadata.file_block_length 682 691 8 7.3 136.5 1.0X
+_metadata.file_modification_time 685 690 4 7.3 136.9 1.0X
+_metadata.row_index 731 741 12 6.8 146.2 0.9X
+_metadata 1026 1035 8 4.9 205.1 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parquet-mr: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-no metadata columns 2005 2050 21 2.5 401.0 1.0X
-_metadata.file_path 2828 2874 18 1.8 565.7 0.7X
-_metadata.file_name 2745 2812 25 1.8 549.0 0.7X
-_metadata.file_size 2527 2567 20 2.0 505.4 0.8X
-_metadata.file_block_start 2515 2546 16 2.0 503.0 0.8X
-_metadata.file_block_length 2531 2588 21 2.0 506.1 0.8X
-_metadata.file_modification_time 2595 2634 34 1.9 519.1 0.8X
-_metadata.row_index 3427 3478 24 1.5 685.4 0.6X
-_metadata 4669 4713 29 1.1 933.9 0.4X
+no metadata columns 2718 2741 18 1.8 543.7 1.0X
+_metadata.file_path 3470 3486 14 1.4 694.0 0.8X
+_metadata.file_name 3437 3458 22 1.5 687.3 0.8X
+_metadata.file_size 3320 3333 10 1.5 664.0 0.8X
+_metadata.file_block_start 3316 3332 14 1.5 663.1 0.8X
+_metadata.file_block_length 3313 3336 22 1.5 662.6 0.8X
+_metadata.file_modification_time 3314 3328 12 1.5 662.8 0.8X
+_metadata.row_index 3666 3687 25 1.4 733.1 0.7X
+_metadata 4883 4904 9 1.0 976.6 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
JSON: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-no metadata columns 6665 6893 88 0.8 1333.1 1.0X
-_metadata.file_path 7367 7424 39 0.7 1473.4 0.9X
-_metadata.file_name 7384 7445 39 0.7 1476.8 0.9X
-_metadata.file_size 7193 7227 20 0.7 1438.6 0.9X
-_metadata.file_block_start 7207 7250 27 0.7 1441.4 0.9X
-_metadata.file_block_length 7183 7345 154 0.7 1436.6 0.9X
-_metadata.file_modification_time 7236 7281 34 0.7 1447.2 0.9X
-_metadata 8172 8239 46 0.6 1634.5 0.8X
+no metadata columns 7035 7057 16 0.7 1407.0 1.0X
+_metadata.file_path 7916 7950 42 0.6 1583.2 0.9X
+_metadata.file_name 7926 7948 15 0.6 1585.3 0.9X
+_metadata.file_size 7671 7705 17 0.7 1534.2 0.9X
+_metadata.file_block_start 7697 7721 15 0.6 1539.4 0.9X
+_metadata.file_block_length 7706 7729 13 0.6 1541.2 0.9X
+_metadata.file_modification_time 7709 7741 22 0.6 1541.9 0.9X
+_metadata 8703 8727 14 0.6 1740.5 0.8X
diff --git a/sql/core/benchmarks/MetricsAggregationBenchmark-jdk21-results.txt b/sql/core/benchmarks/MetricsAggregationBenchmark-jdk21-results.txt
index 4baacbec53763..a02bedff5b676 100644
--- a/sql/core/benchmarks/MetricsAggregationBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/MetricsAggregationBenchmark-jdk21-results.txt
@@ -1,12 +1,12 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
metrics aggregation (50 metrics, 100000 tasks per stage): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-1 stage(s) 471 621 140 0.0 470645682.0 1.0X
-2 stage(s) 990 1152 228 0.0 990437475.0 0.5X
-3 stage(s) 1685 1804 169 0.0 1684707956.0 0.3X
+1 stage(s) 510 673 113 0.0 510483174.0 1.0X
+2 stage(s) 1590 1640 71 0.0 1590439310.0 0.3X
+3 stage(s) 2512 2582 100 0.0 2511748396.0 0.2X
Stage Count Stage Proc. Time Aggreg. Time
- 1 376 58
- 2 288 131
- 3 352 157
+ 1 499 58
+ 2 563 167
+ 3 552 258
diff --git a/sql/core/benchmarks/MetricsAggregationBenchmark-results.txt b/sql/core/benchmarks/MetricsAggregationBenchmark-results.txt
index 5324f515b813c..f0df3ee4fe20d 100644
--- a/sql/core/benchmarks/MetricsAggregationBenchmark-results.txt
+++ b/sql/core/benchmarks/MetricsAggregationBenchmark-results.txt
@@ -1,12 +1,12 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
metrics aggregation (50 metrics, 100000 tasks per stage): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
----------------------------------------------------------------------------------------------------------------------------------------
-1 stage(s) 635 682 45 0.0 635457575.0 1.0X
-2 stage(s) 1395 1406 16 0.0 1394972033.0 0.5X
-3 stage(s) 1935 2037 145 0.0 1934636284.0 0.3X
+1 stage(s) 383 418 71 0.0 383366848.0 1.0X
+2 stage(s) 1367 1383 22 0.0 1367425765.0 0.3X
+3 stage(s) 1732 1910 253 0.0 1731683484.0 0.2X
Stage Count Stage Proc. Time Aggreg. Time
- 1 402 36
- 2 367 179
- 3 390 174
+ 1 252 51
+ 2 400 148
+ 3 371 246
diff --git a/sql/core/benchmarks/MiscBenchmark-jdk21-results.txt b/sql/core/benchmarks/MiscBenchmark-jdk21-results.txt
index ff2335fc3d6e1..422b5fd109610 100644
--- a/sql/core/benchmarks/MiscBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/MiscBenchmark-jdk21-results.txt
@@ -2,126 +2,126 @@
filter & aggregate without group
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
range/filter/sum: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-range/filter/sum wholestage off 35430 36341 1288 59.2 16.9 1.0X
-range/filter/sum wholestage on 3511 3649 78 597.2 1.7 10.1X
+range/filter/sum wholestage off 36339 37196 1213 57.7 17.3 1.0X
+range/filter/sum wholestage on 3502 3770 300 598.8 1.7 10.4X
================================================================================================
range/limit/sum
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
range/limit/sum: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-range/limit/sum wholestage off 67 68 2 7864.7 0.1 1.0X
-range/limit/sum wholestage on 81 95 12 6502.2 0.2 0.8X
+range/limit/sum wholestage off 74 75 2 7125.3 0.1 1.0X
+range/limit/sum wholestage on 75 84 7 6972.8 0.1 1.0X
================================================================================================
sample
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sample with replacement: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-sample with replacement wholestage off 7948 8022 104 16.5 60.6 1.0X
-sample with replacement wholestage on 5104 5183 45 25.7 38.9 1.6X
+sample with replacement wholestage off 8091 8152 87 16.2 61.7 1.0X
+sample with replacement wholestage on 5134 5156 21 25.5 39.2 1.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sample without replacement: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-sample without replacement wholestage off 1832 1842 14 71.6 14.0 1.0X
-sample without replacement wholestage on 661 671 8 198.4 5.0 2.8X
+sample without replacement wholestage off 1895 1896 2 69.2 14.5 1.0X
+sample without replacement wholestage on 657 677 13 199.6 5.0 2.9X
================================================================================================
collect
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collect: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-collect 1 million 154 214 58 6.8 147.0 1.0X
-collect 2 millions 329 422 86 3.2 313.6 0.5X
-collect 4 millions 741 821 83 1.4 706.9 0.2X
+collect 1 million 169 218 118 6.2 161.3 1.0X
+collect 2 millions 309 440 84 3.4 294.7 0.5X
+collect 4 millions 635 747 116 1.7 605.7 0.3X
================================================================================================
collect limit
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collect limit: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-collect limit 1 million 151 222 69 7.0 143.7 1.0X
-collect limit 2 millions 314 421 131 3.3 299.0 0.5X
+collect limit 1 million 149 230 95 7.1 141.8 1.0X
+collect limit 2 millions 288 409 70 3.6 274.5 0.5X
================================================================================================
generate explode
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate explode array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate explode array wholestage off 11858 11982 176 1.4 706.8 1.0X
-generate explode array wholestage on 3019 3063 86 5.6 179.9 3.9X
+generate explode array wholestage off 12491 12542 71 1.3 744.5 1.0X
+generate explode array wholestage on 2970 3145 175 5.6 177.0 4.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate explode map: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate explode map wholestage off 24900 24951 72 0.7 1484.1 1.0X
-generate explode map wholestage on 9324 9385 41 1.8 555.8 2.7X
+generate explode map wholestage off 24462 24644 257 0.7 1458.0 1.0X
+generate explode map wholestage on 9106 9313 230 1.8 542.7 2.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate posexplode array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate posexplode array wholestage off 12596 12671 105 1.3 750.8 1.0X
-generate posexplode array wholestage on 2984 3094 71 5.6 177.8 4.2X
+generate posexplode array wholestage off 12603 12606 4 1.3 751.2 1.0X
+generate posexplode array wholestage on 3011 3097 49 5.6 179.5 4.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate inline array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate inline array wholestage off 7072 7114 59 2.4 421.5 1.0X
-generate inline array wholestage on 2399 2468 74 7.0 143.0 2.9X
+generate inline array wholestage off 6943 6983 57 2.4 413.8 1.0X
+generate inline array wholestage on 2498 2566 75 6.7 148.9 2.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate big struct array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate big struct array wholestage off 208 209 1 0.3 3463.4 1.0X
-generate big struct array wholestage on 156 169 14 0.4 2593.2 1.3X
+generate big struct array wholestage off 192 198 8 0.3 3201.2 1.0X
+generate big struct array wholestage on 152 161 8 0.4 2526.6 1.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate big nested struct array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-generate big nested struct array wholestage off 18211 18237 36 0.0 303524.5 1.0X
-generate big nested struct array wholestage on 154 172 16 0.4 2559.5 118.6X
+generate big nested struct array wholestage off 18968 20994 2866 0.0 316136.8 1.0X
+generate big nested struct array wholestage on 153 161 9 0.4 2544.7 124.2X
================================================================================================
generate regular generator
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate stack: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate stack wholestage off 13727 13943 305 1.2 818.2 1.0X
-generate stack wholestage on 3152 3206 36 5.3 187.9 4.4X
+generate stack wholestage off 13409 13455 66 1.3 799.2 1.0X
+generate stack wholestage on 3050 3056 4 5.5 181.8 4.4X
diff --git a/sql/core/benchmarks/MiscBenchmark-results.txt b/sql/core/benchmarks/MiscBenchmark-results.txt
index f2d3eb1988b62..24b0ce572ddae 100644
--- a/sql/core/benchmarks/MiscBenchmark-results.txt
+++ b/sql/core/benchmarks/MiscBenchmark-results.txt
@@ -2,126 +2,126 @@
filter & aggregate without group
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
range/filter/sum: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-range/filter/sum wholestage off 36214 36785 807 57.9 17.3 1.0X
-range/filter/sum wholestage on 3468 3752 160 604.7 1.7 10.4X
+range/filter/sum wholestage off 36126 37069 1333 58.1 17.2 1.0X
+range/filter/sum wholestage on 3453 3747 166 607.3 1.6 10.5X
================================================================================================
range/limit/sum
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
range/limit/sum: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-range/limit/sum wholestage off 76 76 0 6926.9 0.1 1.0X
-range/limit/sum wholestage on 78 81 3 6685.5 0.1 1.0X
+range/limit/sum wholestage off 73 76 5 7206.6 0.1 1.0X
+range/limit/sum wholestage on 87 95 6 6028.2 0.2 0.8X
================================================================================================
sample
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sample with replacement: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-sample with replacement wholestage off 8042 8116 106 16.3 61.4 1.0X
-sample with replacement wholestage on 5265 5351 52 24.9 40.2 1.5X
+sample with replacement wholestage off 7717 7759 60 17.0 58.9 1.0X
+sample with replacement wholestage on 5018 5026 7 26.1 38.3 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
sample without replacement: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-sample without replacement wholestage off 1942 1946 6 67.5 14.8 1.0X
-sample without replacement wholestage on 713 740 29 183.8 5.4 2.7X
+sample without replacement wholestage off 1808 1814 8 72.5 13.8 1.0X
+sample without replacement wholestage on 701 743 77 186.9 5.3 2.6X
================================================================================================
collect
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collect: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-collect 1 million 158 216 72 6.7 150.2 1.0X
-collect 2 millions 298 407 91 3.5 284.3 0.5X
-collect 4 millions 722 827 132 1.5 688.9 0.2X
+collect 1 million 160 213 67 6.6 152.2 1.0X
+collect 2 millions 301 430 73 3.5 286.9 0.5X
+collect 4 millions 716 840 134 1.5 682.5 0.2X
================================================================================================
collect limit
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
collect limit: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-collect limit 1 million 152 235 119 6.9 145.4 1.0X
-collect limit 2 millions 317 433 117 3.3 302.2 0.5X
+collect limit 1 million 162 200 66 6.5 154.4 1.0X
+collect limit 2 millions 315 407 75 3.3 300.2 0.5X
================================================================================================
generate explode
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate explode array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate explode array wholestage off 11844 11877 48 1.4 705.9 1.0X
-generate explode array wholestage on 2946 2980 59 5.7 175.6 4.0X
+generate explode array wholestage off 11515 11594 112 1.5 686.3 1.0X
+generate explode array wholestage on 2936 3021 82 5.7 175.0 3.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate explode map: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate explode map wholestage off 23185 23254 98 0.7 1381.9 1.0X
-generate explode map wholestage on 9594 9844 196 1.7 571.8 2.4X
+generate explode map wholestage off 23775 23804 41 0.7 1417.1 1.0X
+generate explode map wholestage on 9691 9798 93 1.7 577.6 2.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate posexplode array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate posexplode array wholestage off 12281 12328 67 1.4 732.0 1.0X
-generate posexplode array wholestage on 2914 3004 76 5.8 173.7 4.2X
+generate posexplode array wholestage off 12212 12393 257 1.4 727.9 1.0X
+generate posexplode array wholestage on 2971 3034 40 5.6 177.1 4.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate inline array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate inline array wholestage off 6803 6881 112 2.5 405.5 1.0X
-generate inline array wholestage on 2506 2515 11 6.7 149.4 2.7X
+generate inline array wholestage off 6705 6754 69 2.5 399.7 1.0X
+generate inline array wholestage on 2490 2525 40 6.7 148.4 2.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate big struct array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate big struct array wholestage off 228 241 18 0.3 3799.8 1.0X
-generate big struct array wholestage on 175 181 5 0.3 2909.8 1.3X
+generate big struct array wholestage off 200 212 16 0.3 3339.2 1.0X
+generate big struct array wholestage on 180 188 14 0.3 2996.2 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate big nested struct array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------
-generate big nested struct array wholestage off 17588 18273 968 0.0 293139.3 1.0X
-generate big nested struct array wholestage on 169 179 8 0.4 2812.8 104.2X
+generate big nested struct array wholestage off 18810 19086 390 0.0 313505.9 1.0X
+generate big nested struct array wholestage on 173 186 13 0.3 2886.8 108.6X
================================================================================================
generate regular generator
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
generate stack: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-generate stack wholestage off 13013 13020 10 1.3 775.7 1.0X
-generate stack wholestage on 3085 3093 7 5.4 183.9 4.2X
+generate stack wholestage off 12822 12842 28 1.3 764.3 1.0X
+generate stack wholestage on 3056 3073 13 5.5 182.2 4.2X
diff --git a/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-jdk21-results.txt b/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-jdk21-results.txt
index 4fcfd547e40dd..f87f452a1b484 100644
--- a/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-jdk21-results.txt
@@ -2,52 +2,52 @@
Nested Schema Pruning Benchmark For ORC v1
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Selection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 59 71 8 16.9 59.3 1.0X
-Nested column 58 66 7 17.3 57.7 1.0X
-Nested column in array 161 166 3 6.2 160.8 0.4X
+Top-level column 67 93 14 14.8 67.4 1.0X
+Nested column 61 72 8 16.4 60.9 1.1X
+Nested column in array 168 171 3 6.0 167.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Limiting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 227 240 12 4.4 227.0 1.0X
-Nested column 230 253 17 4.3 230.1 1.0X
-Nested column in array 500 522 14 2.0 500.1 0.5X
+Top-level column 239 255 16 4.2 239.2 1.0X
+Nested column 245 267 16 4.1 245.1 1.0X
+Nested column in array 539 562 20 1.9 539.0 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 206 218 9 4.9 206.1 1.0X
-Nested column 210 221 12 4.8 210.0 1.0X
-Nested column in array 448 469 12 2.2 447.7 0.5X
+Top-level column 215 229 11 4.7 214.7 1.0X
+Nested column 225 239 11 4.4 224.7 1.0X
+Nested column in array 481 488 5 2.1 480.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning by exprs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 201 214 7 5.0 200.7 1.0X
-Nested column 224 237 8 4.5 223.8 0.9X
-Nested column in array 501 514 7 2.0 500.8 0.4X
+Top-level column 212 226 10 4.7 212.2 1.0X
+Nested column 234 248 8 4.3 234.2 0.9X
+Nested column in array 512 521 7 2.0 512.4 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sample: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 67 79 10 15.0 66.8 1.0X
-Nested column 75 91 17 13.3 75.0 0.9X
-Nested column in array 214 232 11 4.7 213.6 0.3X
+Top-level column 67 82 13 14.9 66.9 1.0X
+Nested column 75 91 13 13.4 74.8 0.9X
+Nested column in array 215 240 24 4.6 215.2 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sorting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 293 306 13 3.4 293.5 1.0X
-Nested column 340 349 10 2.9 340.4 0.9X
-Nested column in array 712 778 41 1.4 712.3 0.4X
+Top-level column 297 314 16 3.4 297.1 1.0X
+Nested column 341 351 14 2.9 341.5 0.9X
+Nested column in array 714 729 19 1.4 714.4 0.4X
diff --git a/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-results.txt b/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-results.txt
index a50f57fd5abbe..74179e5b6c504 100644
--- a/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-results.txt
+++ b/sql/core/benchmarks/OrcNestedSchemaPruningBenchmark-results.txt
@@ -2,52 +2,52 @@
Nested Schema Pruning Benchmark For ORC v1
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Selection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 62 79 11 16.1 62.0 1.0X
-Nested column 58 66 7 17.2 58.2 1.1X
-Nested column in array 160 166 5 6.2 160.4 0.4X
+Top-level column 63 78 11 16.0 62.7 1.0X
+Nested column 58 67 7 17.2 58.3 1.1X
+Nested column in array 168 177 9 5.9 168.5 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Limiting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 226 246 12 4.4 226.0 1.0X
-Nested column 230 247 11 4.4 229.8 1.0X
-Nested column in array 488 507 22 2.0 488.0 0.5X
+Top-level column 247 263 22 4.0 247.4 1.0X
+Nested column 236 252 9 4.2 235.9 1.0X
+Nested column in array 490 512 14 2.0 489.8 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 205 209 5 4.9 204.5 1.0X
-Nested column 209 216 6 4.8 208.7 1.0X
-Nested column in array 447 454 5 2.2 447.3 0.5X
+Top-level column 207 214 5 4.8 207.5 1.0X
+Nested column 214 221 6 4.7 213.6 1.0X
+Nested column in array 454 460 4 2.2 453.7 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning by exprs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 202 207 5 5.0 201.8 1.0X
-Nested column 225 233 4 4.4 225.1 0.9X
-Nested column in array 481 489 6 2.1 481.2 0.4X
+Top-level column 209 212 2 4.8 208.7 1.0X
+Nested column 231 238 7 4.3 230.6 0.9X
+Nested column in array 488 495 5 2.1 487.5 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sample: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 67 80 12 15.0 66.9 1.0X
-Nested column 74 89 14 13.5 74.3 0.9X
-Nested column in array 193 252 48 5.2 193.5 0.3X
+Top-level column 70 77 6 14.2 70.3 1.0X
+Nested column 76 91 14 13.2 75.9 0.9X
+Nested column in array 208 243 26 4.8 208.3 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sorting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 285 297 8 3.5 285.1 1.0X
-Nested column 342 349 5 2.9 341.9 0.8X
-Nested column in array 714 722 8 1.4 713.5 0.4X
+Top-level column 297 306 7 3.4 297.0 1.0X
+Nested column 351 359 6 2.9 350.9 0.8X
+Nested column in array 696 711 17 1.4 695.7 0.4X
diff --git a/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-jdk21-results.txt b/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-jdk21-results.txt
index 9478a15923122..3805177dde47b 100644
--- a/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-jdk21-results.txt
@@ -2,52 +2,52 @@
Nested Schema Pruning Benchmark For ORC v2
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Selection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 59 75 10 17.0 58.8 1.0X
-Nested column 60 68 7 16.8 59.5 1.0X
-Nested column in array 160 164 4 6.3 160.0 0.4X
+Top-level column 59 73 12 16.9 59.1 1.0X
+Nested column 58 67 6 17.2 58.0 1.0X
+Nested column in array 167 172 5 6.0 167.1 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Limiting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 243 258 13 4.1 242.5 1.0X
-Nested column 234 256 15 4.3 234.4 1.0X
-Nested column in array 525 543 12 1.9 525.2 0.5X
+Top-level column 243 260 22 4.1 243.4 1.0X
+Nested column 244 263 15 4.1 243.6 1.0X
+Nested column in array 508 538 17 2.0 508.1 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 209 221 7 4.8 209.3 1.0X
-Nested column 217 229 8 4.6 217.2 1.0X
-Nested column in array 458 474 7 2.2 457.7 0.5X
+Top-level column 213 227 8 4.7 213.2 1.0X
+Nested column 221 233 7 4.5 221.3 1.0X
+Nested column in array 464 481 14 2.2 464.2 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning by exprs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 205 217 8 4.9 205.4 1.0X
-Nested column 228 239 7 4.4 227.7 0.9X
-Nested column in array 498 509 6 2.0 498.3 0.4X
+Top-level column 212 224 8 4.7 212.1 1.0X
+Nested column 243 254 7 4.1 243.3 0.9X
+Nested column in array 514 522 6 1.9 514.4 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sample: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 73 85 12 13.6 73.4 1.0X
-Nested column 76 92 12 13.1 76.3 1.0X
-Nested column in array 204 233 32 4.9 203.7 0.4X
+Top-level column 73 83 11 13.7 73.0 1.0X
+Nested column 76 89 11 13.1 76.3 1.0X
+Nested column in array 214 254 33 4.7 214.5 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sorting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 296 307 18 3.4 295.9 1.0X
-Nested column 337 348 18 3.0 337.1 0.9X
-Nested column in array 683 711 34 1.5 682.6 0.4X
+Top-level column 307 326 25 3.3 306.9 1.0X
+Nested column 352 361 13 2.8 351.7 0.9X
+Nested column in array 708 728 15 1.4 708.3 0.4X
diff --git a/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-results.txt b/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-results.txt
index 9c608cdc104db..75c922e834670 100644
--- a/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-results.txt
+++ b/sql/core/benchmarks/OrcV2NestedSchemaPruningBenchmark-results.txt
@@ -2,52 +2,52 @@
Nested Schema Pruning Benchmark For ORC v2
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Selection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 64 76 11 15.6 64.1 1.0X
-Nested column 57 64 4 17.7 56.6 1.1X
-Nested column in array 160 165 5 6.3 159.6 0.4X
+Top-level column 69 84 11 14.5 68.9 1.0X
+Nested column 59 67 5 16.8 59.5 1.2X
+Nested column in array 167 171 4 6.0 166.6 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Limiting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 231 248 15 4.3 230.8 1.0X
-Nested column 234 251 20 4.3 233.5 1.0X
-Nested column in array 498 523 16 2.0 498.0 0.5X
+Top-level column 233 259 20 4.3 233.1 1.0X
+Nested column 235 248 9 4.2 235.5 1.0X
+Nested column in array 493 511 12 2.0 493.0 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 203 211 6 4.9 202.5 1.0X
-Nested column 209 217 4 4.8 209.2 1.0X
-Nested column in array 447 455 6 2.2 446.9 0.5X
+Top-level column 207 214 6 4.8 206.7 1.0X
+Nested column 210 218 7 4.8 210.5 1.0X
+Nested column in array 445 452 4 2.2 445.1 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning by exprs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 204 206 3 4.9 203.6 1.0X
-Nested column 225 230 5 4.4 225.2 0.9X
-Nested column in array 482 489 6 2.1 481.8 0.4X
+Top-level column 203 207 3 4.9 203.4 1.0X
+Nested column 229 236 6 4.4 228.5 0.9X
+Nested column in array 479 487 6 2.1 479.2 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sample: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 60 81 10 16.7 60.0 1.0X
-Nested column 75 89 19 13.3 75.0 0.8X
-Nested column in array 197 236 21 5.1 197.4 0.3X
+Top-level column 69 79 7 14.4 69.3 1.0X
+Nested column 76 89 10 13.2 75.7 0.9X
+Nested column in array 199 218 16 5.0 199.0 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sorting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 295 301 4 3.4 295.1 1.0X
-Nested column 340 348 7 2.9 339.7 0.9X
-Nested column in array 696 713 15 1.4 696.2 0.4X
+Top-level column 290 300 7 3.5 289.8 1.0X
+Nested column 347 352 5 2.9 346.9 0.8X
+Nested column in array 691 704 13 1.4 691.5 0.4X
diff --git a/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-jdk21-results.txt b/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-jdk21-results.txt
index 36df6288ae20c..d577a05c07562 100644
--- a/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-jdk21-results.txt
@@ -1,21 +1,21 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Can skip all row groups: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without nested predicate Pushdown 6432 6461 39 16.3 61.3 1.0X
-With nested predicate Pushdown 50 64 9 2098.5 0.5 128.7X
+Without nested predicate Pushdown 6444 6497 51 16.3 61.5 1.0X
+With nested predicate Pushdown 63 77 12 1661.1 0.6 102.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Can skip some row groups: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without nested predicate Pushdown 6867 7113 88 15.3 65.5 1.0X
-With nested predicate Pushdown 50 66 12 2108.2 0.5 138.1X
+Without nested predicate Pushdown 6923 6941 15 15.1 66.0 1.0X
+With nested predicate Pushdown 56 71 12 1889.2 0.5 124.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Can skip no row groups: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without nested predicate Pushdown 13364 13431 62 7.8 127.4 1.0X
-With nested predicate Pushdown 13367 13482 91 7.8 127.5 1.0X
+Without nested predicate Pushdown 13365 13428 32 7.8 127.5 1.0X
+With nested predicate Pushdown 13404 13469 40 7.8 127.8 1.0X
diff --git a/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-results.txt b/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-results.txt
index 3744a6c32b9e5..638672ca7b4c9 100644
--- a/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-results.txt
+++ b/sql/core/benchmarks/ParquetNestedPredicatePushDownBenchmark-results.txt
@@ -1,21 +1,21 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Can skip all row groups: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without nested predicate Pushdown 7205 7285 64 14.6 68.7 1.0X
-With nested predicate Pushdown 73 87 13 1429.5 0.7 98.2X
+Without nested predicate Pushdown 7237 7306 72 14.5 69.0 1.0X
+With nested predicate Pushdown 55 72 13 1904.2 0.5 131.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Can skip some row groups: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without nested predicate Pushdown 7554 7851 109 13.9 72.0 1.0X
-With nested predicate Pushdown 54 74 7 1954.7 0.5 140.8X
+Without nested predicate Pushdown 7775 7852 63 13.5 74.1 1.0X
+With nested predicate Pushdown 63 74 6 1665.2 0.6 123.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Can skip no row groups: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Without nested predicate Pushdown 14165 14208 28 7.4 135.1 1.0X
-With nested predicate Pushdown 14195 14250 57 7.4 135.4 1.0X
+Without nested predicate Pushdown 14210 14261 37 7.4 135.5 1.0X
+With nested predicate Pushdown 14216 14254 33 7.4 135.6 1.0X
diff --git a/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-jdk21-results.txt b/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-jdk21-results.txt
index 03124ec591c2c..9351880547265 100644
--- a/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-jdk21-results.txt
@@ -2,52 +2,52 @@
Nested Schema Pruning Benchmark For Parquet
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Selection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 63 77 12 15.8 63.4 1.0X
-Nested column 64 71 6 15.6 64.0 1.0X
-Nested column in array 215 220 5 4.6 215.2 0.3X
+Top-level column 65 78 16 15.3 65.4 1.0X
+Nested column 67 76 10 14.9 67.3 1.0X
+Nested column in array 229 237 4 4.4 229.1 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Limiting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 244 269 26 4.1 243.6 1.0X
-Nested column 247 267 15 4.0 247.1 1.0X
-Nested column in array 573 596 18 1.7 573.5 0.4X
+Top-level column 243 263 11 4.1 243.3 1.0X
+Nested column 252 273 13 4.0 251.6 1.0X
+Nested column in array 562 593 24 1.8 561.9 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 220 232 10 4.5 220.5 1.0X
-Nested column 231 243 10 4.3 230.7 1.0X
-Nested column in array 507 530 16 2.0 507.3 0.4X
+Top-level column 234 241 6 4.3 234.1 1.0X
+Nested column 239 249 6 4.2 239.5 1.0X
+Nested column in array 521 535 14 1.9 520.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning by exprs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 216 234 25 4.6 216.4 1.0X
-Nested column 246 259 9 4.1 246.4 0.9X
-Nested column in array 558 563 5 1.8 558.0 0.4X
+Top-level column 222 229 12 4.5 221.6 1.0X
+Nested column 247 267 27 4.1 246.5 0.9X
+Nested column in array 558 571 10 1.8 558.4 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sample: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 73 87 10 13.7 72.8 1.0X
-Nested column 81 91 7 12.4 80.7 0.9X
-Nested column in array 256 291 21 3.9 255.9 0.3X
+Top-level column 75 90 15 13.3 75.1 1.0X
+Nested column 81 98 19 12.3 81.1 0.9X
+Nested column in array 281 309 18 3.6 280.6 0.3X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sorting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 300 316 25 3.3 299.6 1.0X
-Nested column 343 354 10 2.9 342.5 0.9X
-Nested column in array 755 778 25 1.3 754.7 0.4X
+Top-level column 308 324 17 3.2 308.4 1.0X
+Nested column 360 371 16 2.8 359.5 0.9X
+Nested column in array 756 773 17 1.3 755.6 0.4X
diff --git a/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-results.txt b/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-results.txt
index 5f9a95e6fa8cb..8729ffc3428f9 100644
--- a/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-results.txt
+++ b/sql/core/benchmarks/ParquetNestedSchemaPruningBenchmark-results.txt
@@ -2,52 +2,52 @@
Nested Schema Pruning Benchmark For Parquet
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Selection: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 67 88 13 14.9 67.1 1.0X
-Nested column 67 75 6 14.9 67.3 1.0X
-Nested column in array 224 231 3 4.5 224.4 0.3X
+Top-level column 68 81 11 14.7 68.2 1.0X
+Nested column 69 80 9 14.6 68.6 1.0X
+Nested column in array 229 235 5 4.4 228.6 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Limiting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 245 268 30 4.1 244.9 1.0X
-Nested column 244 258 9 4.1 244.0 1.0X
-Nested column in array 551 582 14 1.8 551.4 0.4X
+Top-level column 255 272 12 3.9 254.8 1.0X
+Nested column 249 262 8 4.0 248.8 1.0X
+Nested column in array 565 587 14 1.8 564.8 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 215 220 4 4.7 214.6 1.0X
-Nested column 218 226 6 4.6 217.8 1.0X
-Nested column in array 511 516 5 2.0 511.2 0.4X
+Top-level column 223 227 4 4.5 222.8 1.0X
+Nested column 224 232 6 4.5 224.4 1.0X
+Nested column in array 520 524 4 1.9 519.6 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Repartitioning by exprs: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 211 218 6 4.7 211.0 1.0X
-Nested column 237 244 9 4.2 237.1 0.9X
-Nested column in array 545 553 4 1.8 545.3 0.4X
+Top-level column 219 225 5 4.6 218.8 1.0X
+Nested column 240 248 6 4.2 240.4 0.9X
+Nested column in array 547 556 7 1.8 547.3 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sample: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 77 87 8 12.9 77.5 1.0X
-Nested column 86 96 10 11.6 85.9 0.9X
-Nested column in array 260 283 13 3.8 259.9 0.3X
+Top-level column 78 92 13 12.9 77.6 1.0X
+Nested column 86 96 10 11.6 86.0 0.9X
+Nested column in array 267 297 19 3.7 267.0 0.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Sorting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Top-level column 302 311 9 3.3 301.6 1.0X
-Nested column 348 354 5 2.9 348.1 0.9X
-Nested column in array 754 775 21 1.3 754.5 0.4X
+Top-level column 305 312 3 3.3 305.0 1.0X
+Nested column 357 369 19 2.8 357.0 0.9X
+Nested column in array 765 775 13 1.3 764.6 0.4X
diff --git a/sql/core/benchmarks/PrimitiveArrayBenchmark-jdk21-results.txt b/sql/core/benchmarks/PrimitiveArrayBenchmark-jdk21-results.txt
index c4e4c1e48a965..8c4594cd37c70 100644
--- a/sql/core/benchmarks/PrimitiveArrayBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/PrimitiveArrayBenchmark-jdk21-results.txt
@@ -2,11 +2,11 @@
Write primitive arrays in dataset
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write an array in Dataset: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 182 226 39 46.2 21.7 1.0X
-Double 243 263 12 34.5 29.0 0.7X
+Int 180 204 13 46.5 21.5 1.0X
+Double 268 283 10 31.3 31.9 0.7X
diff --git a/sql/core/benchmarks/PrimitiveArrayBenchmark-results.txt b/sql/core/benchmarks/PrimitiveArrayBenchmark-results.txt
index 569b9714bed1e..ae32c6361729f 100644
--- a/sql/core/benchmarks/PrimitiveArrayBenchmark-results.txt
+++ b/sql/core/benchmarks/PrimitiveArrayBenchmark-results.txt
@@ -2,11 +2,11 @@
Write primitive arrays in dataset
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write an array in Dataset: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 205 226 21 40.9 24.4 1.0X
-Double 276 288 15 30.4 32.9 0.7X
+Int 212 226 8 39.6 25.3 1.0X
+Double 283 308 26 29.6 33.8 0.7X
diff --git a/sql/core/benchmarks/RangeBenchmark-jdk21-results.txt b/sql/core/benchmarks/RangeBenchmark-jdk21-results.txt
index 39b54801fedd2..f63e056208c29 100644
--- a/sql/core/benchmarks/RangeBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/RangeBenchmark-jdk21-results.txt
@@ -2,14 +2,14 @@
range
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
range: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-full scan 10188 10609 498 51.5 19.4 1.0X
-limit after range 51 53 2 10288.3 0.1 199.9X
-filter after range 1017 1035 21 515.5 1.9 10.0X
-count after range 351 355 5 1495.4 0.7 29.1X
-count after limit after range 60 62 2 8676.6 0.1 168.6X
+full scan 10038 10468 600 52.2 19.1 1.0X
+limit after range 46 50 8 11408.3 0.1 218.4X
+filter after range 1010 1018 8 519.0 1.9 9.9X
+count after range 352 361 9 1489.1 0.7 28.5X
+count after limit after range 53 59 4 9913.1 0.1 189.8X
diff --git a/sql/core/benchmarks/RangeBenchmark-results.txt b/sql/core/benchmarks/RangeBenchmark-results.txt
index c8aec61eb707d..eabc7f1298ca8 100644
--- a/sql/core/benchmarks/RangeBenchmark-results.txt
+++ b/sql/core/benchmarks/RangeBenchmark-results.txt
@@ -2,14 +2,14 @@
range
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
range: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-full scan 9612 10290 492 54.5 18.3 1.0X
-limit after range 50 60 9 10545.4 0.1 193.3X
-filter after range 1004 1012 7 522.1 1.9 9.6X
-count after range 351 358 8 1494.1 0.7 27.4X
-count after limit after range 64 65 1 8190.7 0.1 150.2X
+full scan 9860 10025 111 53.2 18.8 1.0X
+limit after range 61 63 3 8663.2 0.1 162.9X
+filter after range 1009 1025 18 519.6 1.9 9.8X
+count after range 352 355 4 1489.4 0.7 28.0X
+count after limit after range 63 66 3 8265.4 0.1 155.4X
diff --git a/sql/core/benchmarks/RecursiveCTEBenchmark-jdk21-results.txt b/sql/core/benchmarks/RecursiveCTEBenchmark-jdk21-results.txt
new file mode 100644
index 0000000000000..fce114d867b2f
--- /dev/null
+++ b/sql/core/benchmarks/RecursiveCTEBenchmark-jdk21-results.txt
@@ -0,0 +1,95 @@
+================================================================================================
+Recursive CTE with only LocalRelation
+================================================================================================
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 10 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 10 integers using VALUES 136 150 16 0.0 13629654.3 1.0X
+First 10 integers using SELECT 86 93 8 0.0 8592266.5 1.6X
+First 10 integers using SELECT and LIMIT 63 70 9 0.0 6270977.7 2.2X
+First 10 integers referencing external table in anchor 115 141 23 0.0 11516912.5 1.2X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 20 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 20 integers using VALUES 75 81 8 0.0 3767343.2 1.0X
+First 20 integers using SELECT 87 95 7 0.0 4358911.5 0.9X
+First 20 integers using SELECT and LIMIT 59 62 3 0.0 2967261.6 1.3X
+First 20 integers referencing external table in anchor 113 117 3 0.0 5659810.4 0.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 30 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 30 integers using VALUES 77 82 5 0.0 2555962.6 1.0X
+First 30 integers using SELECT 75 83 9 0.0 2488825.0 1.0X
+First 30 integers using SELECT and LIMIT 64 68 6 0.0 2131034.1 1.2X
+First 30 integers referencing external table in anchor 116 131 20 0.0 3870932.1 0.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 40 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 40 integers using VALUES 79 80 0 0.0 1986696.6 1.0X
+First 40 integers using SELECT 75 78 4 0.0 1879019.3 1.1X
+First 40 integers using SELECT and LIMIT 68 71 5 0.0 1702571.8 1.2X
+First 40 integers referencing external table in anchor 114 128 15 0.0 2856194.8 0.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 50 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 50 integers using VALUES 82 93 18 0.0 1633748.5 1.0X
+First 50 integers using SELECT 84 87 6 0.0 1678713.9 1.0X
+First 50 integers using SELECT and LIMIT 75 90 16 0.0 1508240.7 1.1X
+First 50 integers referencing external table in anchor 123 127 4 0.0 2451603.8 0.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 60 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 60 integers using VALUES 91 94 3 0.0 1512050.0 1.0X
+First 60 integers using SELECT 95 98 4 0.0 1576008.7 1.0X
+First 60 integers using SELECT and LIMIT 87 87 0 0.0 1443233.9 1.0X
+First 60 integers referencing external table in anchor 134 137 5 0.0 2227818.3 0.7X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 70 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 70 integers using VALUES 107 114 7 0.0 1531580.2 1.0X
+First 70 integers using SELECT 108 113 5 0.0 1545424.7 1.0X
+First 70 integers using SELECT and LIMIT 99 103 4 0.0 1413035.3 1.1X
+First 70 integers referencing external table in anchor 140 141 1 0.0 1994987.9 0.8X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 80 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 80 integers using VALUES 120 125 5 0.0 1495890.7 1.0X
+First 80 integers using SELECT 119 126 7 0.0 1493331.3 1.0X
+First 80 integers using SELECT and LIMIT 101 103 2 0.0 1268107.2 1.2X
+First 80 integers referencing external table in anchor 154 165 14 0.0 1923761.7 0.8X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 90 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+--------------------------------------------------------------------------------------------------------------------------------------
+First 90 integers using VALUES 123 131 8 0.0 1363274.5 1.0X
+First 90 integers using SELECT 121 127 9 0.0 1345079.3 1.0X
+First 90 integers using SELECT and LIMIT 118 122 4 0.0 1305706.1 1.0X
+First 90 integers referencing external table in anchor 163 169 5 0.0 1813308.8 0.8X
+
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
+First 100 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
+---------------------------------------------------------------------------------------------------------------------------------------
+First 100 integers using VALUES 140 143 2 0.0 1404497.4 1.0X
+First 100 integers using SELECT 133 136 4 0.0 1334375.7 1.1X
+First 100 integers using SELECT and LIMIT 125 129 4 0.0 1246067.9 1.1X
+First 100 integers referencing external table in anchor 170 175 4 0.0 1703882.3 0.8X
+
+
diff --git a/sql/core/benchmarks/RecursiveCTEBenchmark-results.txt b/sql/core/benchmarks/RecursiveCTEBenchmark-results.txt
index 13c1cadc32bcf..a77aafe11591e 100644
--- a/sql/core/benchmarks/RecursiveCTEBenchmark-results.txt
+++ b/sql/core/benchmarks/RecursiveCTEBenchmark-results.txt
@@ -2,94 +2,94 @@
Recursive CTE with only LocalRelation
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 10 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 10 integers using VALUES 31 41 11 0.0 3132641.6 1.0X
-First 10 integers using SELECT 27 29 3 0.0 2674441.6 1.2X
-First 10 integers using SELECT and LIMIT 21 22 0 0.0 2133933.4 1.5X
-First 10 integers referencing external table in anchor 54 59 7 0.0 5351133.4 0.6X
+First 10 integers using VALUES 151 163 18 0.0 15065707.8 1.0X
+First 10 integers using SELECT 108 112 5 0.0 10772405.6 1.4X
+First 10 integers using SELECT and LIMIT 86 90 3 0.0 8620888.3 1.7X
+First 10 integers referencing external table in anchor 150 158 9 0.0 15013999.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 20 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 20 integers using VALUES 25 25 1 0.0 1245431.3 1.0X
-First 20 integers using SELECT 24 24 1 0.0 1183625.0 1.1X
-First 20 integers using SELECT and LIMIT 26 35 12 0.0 1288108.4 1.0X
-First 20 integers referencing external table in anchor 66 89 23 0.0 3291745.9 0.4X
+First 20 integers using VALUES 77 92 14 0.0 3869518.5 1.0X
+First 20 integers using SELECT 91 94 4 0.0 4571792.9 0.8X
+First 20 integers using SELECT and LIMIT 65 72 7 0.0 3236348.5 1.2X
+First 20 integers referencing external table in anchor 124 141 15 0.0 6207737.9 0.6X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 30 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 30 integers using VALUES 25 25 1 0.0 826962.5 1.0X
-First 30 integers using SELECT 25 25 0 0.0 824329.2 1.0X
-First 30 integers using SELECT and LIMIT 24 25 1 0.0 803851.4 1.0X
-First 30 integers referencing external table in anchor 67 70 3 0.0 2247233.3 0.4X
+First 30 integers using VALUES 77 93 16 0.0 2571754.4 1.0X
+First 30 integers using SELECT 96 99 5 0.0 3187083.6 0.8X
+First 30 integers using SELECT and LIMIT 68 76 12 0.0 2250803.4 1.1X
+First 30 integers referencing external table in anchor 123 132 7 0.0 4113510.3 0.6X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 40 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 40 integers using VALUES 29 30 0 0.0 734365.6 1.0X
-First 40 integers using SELECT 29 30 1 0.0 725761.5 1.0X
-First 40 integers using SELECT and LIMIT 29 33 8 0.0 721877.1 1.0X
-First 40 integers referencing external table in anchor 74 85 9 0.0 1860972.9 0.4X
+First 40 integers using VALUES 82 89 7 0.0 2041074.7 1.0X
+First 40 integers using SELECT 85 89 6 0.0 2131638.0 1.0X
+First 40 integers using SELECT and LIMIT 78 80 4 0.0 1947446.2 1.0X
+First 40 integers referencing external table in anchor 118 122 4 0.0 2957424.4 0.7X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 50 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 50 integers using VALUES 34 34 1 0.0 673504.2 1.0X
-First 50 integers using SELECT 35 35 0 0.0 707847.5 1.0X
-First 50 integers using SELECT and LIMIT 32 32 0 0.0 637159.2 1.1X
-First 50 integers referencing external table in anchor 61 62 1 0.0 1217748.3 0.6X
+First 50 integers using VALUES 96 111 13 0.0 1922421.5 1.0X
+First 50 integers using SELECT 86 89 3 0.0 1718552.2 1.1X
+First 50 integers using SELECT and LIMIT 81 90 14 0.0 1610883.5 1.2X
+First 50 integers referencing external table in anchor 140 147 6 0.0 2806679.9 0.7X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 60 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 60 integers using VALUES 38 38 0 0.0 628445.8 1.0X
-First 60 integers using SELECT 38 38 0 0.0 635657.0 1.0X
-First 60 integers using SELECT and LIMIT 35 35 0 0.0 584701.4 1.1X
-First 60 integers referencing external table in anchor 67 81 24 0.0 1109077.8 0.6X
+First 60 integers using VALUES 95 99 4 0.0 1588658.6 1.0X
+First 60 integers using SELECT 94 96 3 0.0 1567532.8 1.0X
+First 60 integers using SELECT and LIMIT 87 87 0 0.0 1449613.9 1.1X
+First 60 integers referencing external table in anchor 138 147 8 0.0 2297241.5 0.7X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 70 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 70 integers using VALUES 42 42 0 0.0 602191.1 1.0X
-First 70 integers using SELECT 42 43 1 0.0 598091.7 1.0X
-First 70 integers using SELECT and LIMIT 40 45 7 0.0 567091.1 1.1X
-First 70 integers referencing external table in anchor 72 90 18 0.0 1033307.7 0.6X
+First 70 integers using VALUES 107 113 7 0.0 1527431.7 1.0X
+First 70 integers using SELECT 107 107 1 0.0 1522253.3 1.0X
+First 70 integers using SELECT and LIMIT 96 100 5 0.0 1376351.6 1.1X
+First 70 integers referencing external table in anchor 152 153 2 0.0 2174213.6 0.7X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 80 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 80 integers using VALUES 53 56 5 0.0 664916.7 1.0X
-First 80 integers using SELECT 47 51 6 0.0 583047.9 1.1X
-First 80 integers using SELECT and LIMIT 52 54 2 0.0 645460.9 1.0X
-First 80 integers referencing external table in anchor 83 95 19 0.0 1042742.7 0.6X
+First 80 integers using VALUES 118 125 11 0.0 1471536.7 1.0X
+First 80 integers using SELECT 118 119 2 0.0 1470698.4 1.0X
+First 80 integers using SELECT and LIMIT 107 109 2 0.0 1335795.1 1.1X
+First 80 integers referencing external table in anchor 156 164 9 0.0 1945739.9 0.8X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 90 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------
-First 90 integers using VALUES 50 51 2 0.0 554144.4 1.0X
-First 90 integers using SELECT 51 55 6 0.0 563051.4 1.0X
-First 90 integers using SELECT and LIMIT 47 48 1 0.0 517157.9 1.1X
-First 90 integers referencing external table in anchor 147 148 1 0.0 1637719.4 0.3X
+First 90 integers using VALUES 128 132 5 0.0 1426374.7 1.0X
+First 90 integers using SELECT 129 133 6 0.0 1431482.2 1.0X
+First 90 integers using SELECT and LIMIT 116 120 4 0.0 1283439.3 1.1X
+First 90 integers referencing external table in anchor 168 173 4 0.0 1871741.3 0.8X
-OpenJDK 64-Bit Server VM 17.0.13+11-LTS on Mac OS X 15.4
-Apple M3 Max
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
+AMD EPYC 7763 64-Core Processor
First 100 integers: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-First 100 integers using VALUES 55 57 2 0.0 550062.9 1.0X
-First 100 integers using SELECT 54 55 0 0.0 544030.0 1.0X
-First 100 integers using SELECT and LIMIT 51 55 6 0.0 511913.8 1.1X
-First 100 integers referencing external table in anchor 99 121 34 0.0 987736.3 0.6X
+First 100 integers using VALUES 140 142 4 0.0 1396375.8 1.0X
+First 100 integers using SELECT 140 143 4 0.0 1395777.3 1.0X
+First 100 integers using SELECT and LIMIT 127 129 3 0.0 1265041.6 1.1X
+First 100 integers referencing external table in anchor 181 186 5 0.0 1809088.1 0.8X
diff --git a/sql/core/benchmarks/SetOperationsBenchmark-jdk21-results.txt b/sql/core/benchmarks/SetOperationsBenchmark-jdk21-results.txt
index aab7d77c3c5e8..37555720abf42 100644
--- a/sql/core/benchmarks/SetOperationsBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/SetOperationsBenchmark-jdk21-results.txt
@@ -2,12 +2,12 @@
Set Operations Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parsing + Analysis: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UNION ALL 293 368 90 0.1 19561.0 1.0X
-EXCEPT ALL 248 258 6 0.1 16558.5 1.2X
-INTERSECT ALL 242 256 16 0.1 16119.8 1.2X
+UNION ALL 133 258 127 0.1 8834.8 1.0X
+EXCEPT ALL 95 100 6 0.2 6332.4 1.4X
+INTERSECT ALL 95 100 4 0.2 6341.7 1.4X
diff --git a/sql/core/benchmarks/SetOperationsBenchmark-results.txt b/sql/core/benchmarks/SetOperationsBenchmark-results.txt
index 7be9efd5dfd38..f1efa0b25910d 100644
--- a/sql/core/benchmarks/SetOperationsBenchmark-results.txt
+++ b/sql/core/benchmarks/SetOperationsBenchmark-results.txt
@@ -2,12 +2,12 @@
Set Operations Benchmark
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Parsing + Analysis: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-UNION ALL 371 502 142 0.0 24706.1 1.0X
-EXCEPT ALL 270 281 8 0.1 17967.1 1.4X
-INTERSECT ALL 267 276 7 0.1 17797.3 1.4X
+UNION ALL 171 298 142 0.1 11411.6 1.0X
+EXCEPT ALL 123 130 6 0.1 8185.4 1.4X
+INTERSECT ALL 123 129 6 0.1 8200.2 1.4X
diff --git a/sql/core/benchmarks/SortBenchmark-jdk21-results.txt b/sql/core/benchmarks/SortBenchmark-jdk21-results.txt
index 9003f22a818e8..2c27c2abb065a 100644
--- a/sql/core/benchmarks/SortBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/SortBenchmark-jdk21-results.txt
@@ -2,15 +2,15 @@
radix sort
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
radix sort 25000000: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-reference TimSort key prefix array 8419 8432 18 3.0 336.8 1.0X
-reference Arrays.sort 2175 2202 38 11.5 87.0 3.9X
-radix sort one byte 66 70 4 378.7 2.6 127.5X
-radix sort two bytes 122 130 13 204.5 4.9 68.9X
-radix sort eight bytes 488 492 7 51.2 19.5 17.2X
-radix sort key prefix array 569 579 13 43.9 22.8 14.8X
+reference TimSort key prefix array 8401 8446 64 3.0 336.0 1.0X
+reference Arrays.sort 2180 2204 35 11.5 87.2 3.9X
+radix sort one byte 65 67 2 384.8 2.6 129.3X
+radix sort two bytes 121 130 7 207.3 4.8 69.6X
+radix sort eight bytes 467 472 5 53.6 18.7 18.0X
+radix sort key prefix array 558 560 2 44.8 22.3 15.1X
diff --git a/sql/core/benchmarks/SortBenchmark-results.txt b/sql/core/benchmarks/SortBenchmark-results.txt
index b8a4f188bc201..7490a3bbf0ee2 100644
--- a/sql/core/benchmarks/SortBenchmark-results.txt
+++ b/sql/core/benchmarks/SortBenchmark-results.txt
@@ -2,15 +2,15 @@
radix sort
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
radix sort 25000000: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-reference TimSort key prefix array 8082 8117 50 3.1 323.3 1.0X
-reference Arrays.sort 2066 2103 53 12.1 82.6 3.9X
-radix sort one byte 63 69 5 396.0 2.5 128.0X
-radix sort two bytes 119 130 6 210.5 4.7 68.1X
-radix sort eight bytes 492 502 7 50.8 19.7 16.4X
-radix sort key prefix array 905 922 16 27.6 36.2 8.9X
+reference TimSort key prefix array 8320 8326 9 3.0 332.8 1.0X
+reference Arrays.sort 2062 2087 35 12.1 82.5 4.0X
+radix sort one byte 63 70 6 398.2 2.5 132.5X
+radix sort two bytes 118 130 6 211.5 4.7 70.4X
+radix sort eight bytes 453 480 17 55.2 18.1 18.4X
+radix sort key prefix array 916 919 3 27.3 36.7 9.1X
diff --git a/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-jdk21-results.txt b/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-jdk21-results.txt
index 1e3fc590644ad..ede4e88fe91d8 100644
--- a/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-jdk21-results.txt
@@ -2,143 +2,143 @@
put rows
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (10000 rows to overwrite - rate 100): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 9 1 1.2 815.6 1.0X
-RocksDB (trackTotalNumberOfRows: true) 46 47 2 0.2 4559.1 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1678.7 0.5X
+In-memory 9 10 1 1.2 856.0 1.0X
+RocksDB (trackTotalNumberOfRows: true) 47 49 2 0.2 4703.5 0.2X
+RocksDB (trackTotalNumberOfRows: false) 18 19 1 0.6 1799.8 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (5000 rows to overwrite - rate 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 9 1 1.3 798.1 1.0X
-RocksDB (trackTotalNumberOfRows: true) 47 48 2 0.2 4659.8 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 17 1 0.6 1663.4 0.5X
+In-memory 8 9 1 1.2 833.3 1.0X
+RocksDB (trackTotalNumberOfRows: true) 48 50 1 0.2 4832.1 0.2X
+RocksDB (trackTotalNumberOfRows: false) 18 19 1 0.6 1791.8 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (1000 rows to overwrite - rate 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 9 1 1.3 794.9 1.0X
-RocksDB (trackTotalNumberOfRows: true) 46 48 1 0.2 4625.7 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 17 1 0.6 1660.7 0.5X
+In-memory 8 10 1 1.2 811.2 1.0X
+RocksDB (trackTotalNumberOfRows: true) 48 50 1 0.2 4799.0 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 19 1 0.6 1741.7 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (0 rows to overwrite - rate 0): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 8 1 1.3 788.6 1.0X
-RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4557.0 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 17 1 0.6 1650.3 0.5X
+In-memory 8 10 1 1.2 810.7 1.0X
+RocksDB (trackTotalNumberOfRows: true) 48 49 1 0.2 4781.2 0.2X
+RocksDB (trackTotalNumberOfRows: false) 18 19 1 0.6 1790.3 0.5X
================================================================================================
merge rows
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (10000 rows to overwrite - rate 100): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 574 585 6 0.0 57387.8 1.0X
-RocksDB (trackTotalNumberOfRows: false) 181 186 3 0.1 18065.2 3.2X
+RocksDB (trackTotalNumberOfRows: true) 581 597 7 0.0 58107.0 1.0X
+RocksDB (trackTotalNumberOfRows: false) 192 197 2 0.1 19209.3 3.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (5000 rows to overwrite - rate 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 504 515 5 0.0 50382.4 1.0X
-RocksDB (trackTotalNumberOfRows: false) 179 185 3 0.1 17882.2 2.8X
+RocksDB (trackTotalNumberOfRows: true) 507 521 5 0.0 50704.7 1.0X
+RocksDB (trackTotalNumberOfRows: false) 191 196 2 0.1 19078.2 2.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (1000 rows to overwrite - rate 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 442 455 6 0.0 44235.2 1.0X
-RocksDB (trackTotalNumberOfRows: false) 180 185 3 0.1 17971.5 2.5X
+RocksDB (trackTotalNumberOfRows: true) 447 459 5 0.0 44665.5 1.0X
+RocksDB (trackTotalNumberOfRows: false) 189 195 2 0.1 18919.4 2.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (0 rows to overwrite - rate 0): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 424 436 5 0.0 42391.9 1.0X
-RocksDB (trackTotalNumberOfRows: false) 179 185 4 0.1 17923.5 2.4X
+RocksDB (trackTotalNumberOfRows: true) 435 448 5 0.0 43468.5 1.0X
+RocksDB (trackTotalNumberOfRows: false) 192 197 2 0.1 19164.7 2.3X
================================================================================================
delete rows
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(10000 rows are non-existing - rate 100): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 0 1 0 27.1 36.9 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 46 1 0.2 4470.0 0.0X
-RocksDB (trackTotalNumberOfRows: false) 16 17 1 0.6 1583.0 0.0X
+In-memory 1 1 0 16.9 59.1 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4604.1 0.0X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1720.5 0.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(5000 rows are non-existing - rate 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 7 0 1.5 651.4 1.0X
-RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4580.3 0.1X
-RocksDB (trackTotalNumberOfRows: false) 16 17 0 0.6 1582.7 0.4X
+In-memory 8 9 1 1.3 762.2 1.0X
+RocksDB (trackTotalNumberOfRows: true) 47 48 1 0.2 4666.1 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1710.9 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(1000 rows are non-existing - rate 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 8 0 1.4 713.7 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 47 1 0.2 4538.6 0.2X
-RocksDB (trackTotalNumberOfRows: false) 16 16 0 0.6 1579.3 0.5X
+In-memory 7 10 1 1.3 748.9 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4580.6 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1721.2 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(0 rows are non-existing - rate 0): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 8 0 1.4 716.9 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 46 1 0.2 4459.8 0.2X
-RocksDB (trackTotalNumberOfRows: false) 16 16 1 0.6 1580.7 0.5X
+In-memory 7 9 1 1.3 746.4 1.0X
+RocksDB (trackTotalNumberOfRows: true) 45 46 1 0.2 4479.1 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1658.2 0.5X
================================================================================================
evict rows
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 10000 rows (maxTimestampToEvictInMillis: 9999) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 7 0 1.5 689.5 1.0X
-RocksDB (trackTotalNumberOfRows: true) 44 45 1 0.2 4424.0 0.2X
-RocksDB (trackTotalNumberOfRows: false) 18 18 0 0.6 1784.2 0.4X
+In-memory 7 7 0 1.4 693.6 1.0X
+RocksDB (trackTotalNumberOfRows: true) 43 44 1 0.2 4315.4 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1724.8 0.4X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 5000 rows (maxTimestampToEvictInMillis: 4999) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 6 7 0 1.5 650.0 1.0X
-RocksDB (trackTotalNumberOfRows: true) 23 24 1 0.4 2347.8 0.3X
-RocksDB (trackTotalNumberOfRows: false) 10 11 0 1.0 1037.1 0.6X
+In-memory 7 7 0 1.5 650.5 1.0X
+RocksDB (trackTotalNumberOfRows: true) 23 24 1 0.4 2308.7 0.3X
+RocksDB (trackTotalNumberOfRows: false) 10 11 0 1.0 1037.6 0.6X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 1000 rows (maxTimestampToEvictInMillis: 999) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 6 6 0 1.7 585.4 1.0X
-RocksDB (trackTotalNumberOfRows: true) 8 8 0 1.3 766.5 0.8X
-RocksDB (trackTotalNumberOfRows: false) 5 5 0 2.0 503.2 1.2X
+In-memory 6 7 0 1.7 598.8 1.0X
+RocksDB (trackTotalNumberOfRows: true) 7 8 0 1.3 744.0 0.8X
+RocksDB (trackTotalNumberOfRows: false) 5 5 0 2.0 488.2 1.2X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 0 rows (maxTimestampToEvictInMillis: -1) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 0 0 0 25.0 40.1 1.0X
-RocksDB (trackTotalNumberOfRows: true) 4 4 0 2.8 359.1 0.1X
-RocksDB (trackTotalNumberOfRows: false) 4 4 0 2.8 359.9 0.1X
+In-memory 0 1 0 23.1 43.3 1.0X
+RocksDB (trackTotalNumberOfRows: true) 3 4 0 2.9 349.9 0.1X
+RocksDB (trackTotalNumberOfRows: false) 4 4 1 2.9 350.0 0.1X
diff --git a/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-results.txt b/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-results.txt
index a3688c16f100a..19264ccf4a1a8 100644
--- a/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-results.txt
+++ b/sql/core/benchmarks/StateStoreBasicOperationsBenchmark-results.txt
@@ -2,143 +2,143 @@
put rows
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (10000 rows to overwrite - rate 100): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 9 1 1.2 816.3 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 47 1 0.2 4514.1 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1682.7 0.5X
+In-memory 8 9 1 1.2 806.5 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 48 1 0.2 4641.9 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1739.9 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (5000 rows to overwrite - rate 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 10 1 1.2 811.7 1.0X
-RocksDB (trackTotalNumberOfRows: true) 47 49 1 0.2 4694.9 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1680.2 0.5X
+In-memory 8 9 0 1.2 801.7 1.0X
+RocksDB (trackTotalNumberOfRows: true) 48 50 1 0.2 4800.8 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1720.0 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (1000 rows to overwrite - rate 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 9 1 1.3 786.5 1.0X
-RocksDB (trackTotalNumberOfRows: true) 47 48 1 0.2 4679.7 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1650.0 0.5X
+In-memory 8 8 0 1.3 782.4 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4614.3 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1702.2 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
putting 10000 rows (0 rows to overwrite - rate 0): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-In-memory 8 8 1 1.3 778.0 1.0X
-RocksDB (trackTotalNumberOfRows: true) 46 48 1 0.2 4629.4 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 17 1 0.6 1664.9 0.5X
+In-memory 8 8 0 1.3 771.9 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4554.4 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 1 0.6 1698.3 0.5X
================================================================================================
merge rows
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (10000 rows to overwrite - rate 100): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 570 585 6 0.0 56996.2 1.0X
-RocksDB (trackTotalNumberOfRows: false) 184 190 3 0.1 18411.4 3.1X
+RocksDB (trackTotalNumberOfRows: true) 580 592 5 0.0 57963.9 1.0X
+RocksDB (trackTotalNumberOfRows: false) 194 199 3 0.1 19366.7 3.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (5000 rows to overwrite - rate 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 493 505 5 0.0 49327.2 1.0X
-RocksDB (trackTotalNumberOfRows: false) 181 188 3 0.1 18140.8 2.7X
+RocksDB (trackTotalNumberOfRows: true) 509 522 7 0.0 50899.9 1.0X
+RocksDB (trackTotalNumberOfRows: false) 194 199 3 0.1 19417.5 2.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (1000 rows to overwrite - rate 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 435 448 5 0.0 43484.3 1.0X
-RocksDB (trackTotalNumberOfRows: false) 183 188 3 0.1 18289.1 2.4X
+RocksDB (trackTotalNumberOfRows: true) 450 460 4 0.0 44950.2 1.0X
+RocksDB (trackTotalNumberOfRows: false) 192 197 2 0.1 19171.3 2.3X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
merging 10000 rows with 10 values per key (0 rows to overwrite - rate 0): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------
-RocksDB (trackTotalNumberOfRows: true) 416 432 5 0.0 41606.2 1.0X
-RocksDB (trackTotalNumberOfRows: false) 183 189 3 0.1 18282.2 2.3X
+RocksDB (trackTotalNumberOfRows: true) 429 439 4 0.0 42875.5 1.0X
+RocksDB (trackTotalNumberOfRows: false) 191 197 2 0.1 19059.3 2.2X
================================================================================================
delete rows
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(10000 rows are non-existing - rate 100): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 0 1 0 26.6 37.7 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 47 1 0.2 4514.1 0.0X
-RocksDB (trackTotalNumberOfRows: false) 16 17 0 0.6 1587.8 0.0X
+In-memory 0 1 0 25.6 39.0 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4575.3 0.0X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1684.7 0.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(5000 rows are non-existing - rate 50): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 6 7 1 1.6 644.9 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 47 1 0.2 4524.6 0.1X
-RocksDB (trackTotalNumberOfRows: false) 16 17 1 0.6 1579.1 0.4X
+In-memory 6 7 0 1.6 630.0 1.0X
+RocksDB (trackTotalNumberOfRows: true) 47 48 1 0.2 4667.7 0.1X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1697.3 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(1000 rows are non-existing - rate 10): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 8 1 1.4 698.2 1.0X
-RocksDB (trackTotalNumberOfRows: true) 45 46 1 0.2 4481.1 0.2X
-RocksDB (trackTotalNumberOfRows: false) 16 17 1 0.6 1585.3 0.4X
+In-memory 7 7 0 1.4 701.4 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4590.1 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1698.0 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
trying to delete 10000 rows from 10000 rows(0 rows are non-existing - rate 0): Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 8 1 1.4 707.0 1.0X
-RocksDB (trackTotalNumberOfRows: true) 43 45 1 0.2 4326.6 0.2X
-RocksDB (trackTotalNumberOfRows: false) 16 17 1 0.6 1560.6 0.5X
+In-memory 7 7 0 1.4 716.7 1.0X
+RocksDB (trackTotalNumberOfRows: true) 46 47 1 0.2 4563.4 0.2X
+RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1665.2 0.4X
================================================================================================
evict rows
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 10000 rows (maxTimestampToEvictInMillis: 9999) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 7 7 0 1.4 693.7 1.0X
-RocksDB (trackTotalNumberOfRows: true) 43 44 1 0.2 4285.3 0.2X
-RocksDB (trackTotalNumberOfRows: false) 17 18 0 0.6 1726.3 0.4X
+In-memory 7 7 0 1.5 683.9 1.0X
+RocksDB (trackTotalNumberOfRows: true) 45 46 1 0.2 4454.0 0.2X
+RocksDB (trackTotalNumberOfRows: false) 18 18 0 0.6 1771.2 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 5000 rows (maxTimestampToEvictInMillis: 4999) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 6 7 0 1.5 646.3 1.0X
-RocksDB (trackTotalNumberOfRows: true) 24 24 0 0.4 2351.2 0.3X
-RocksDB (trackTotalNumberOfRows: false) 11 11 0 0.9 1062.9 0.6X
+In-memory 6 7 0 1.6 631.7 1.0X
+RocksDB (trackTotalNumberOfRows: true) 24 25 0 0.4 2414.0 0.3X
+RocksDB (trackTotalNumberOfRows: false) 11 11 0 0.9 1066.8 0.6X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 1000 rows (maxTimestampToEvictInMillis: 999) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 6 6 0 1.7 587.7 1.0X
-RocksDB (trackTotalNumberOfRows: true) 8 8 0 1.3 784.7 0.7X
-RocksDB (trackTotalNumberOfRows: false) 5 6 0 1.9 529.1 1.1X
+In-memory 6 6 0 1.7 574.0 1.0X
+RocksDB (trackTotalNumberOfRows: true) 8 8 0 1.3 780.8 0.7X
+RocksDB (trackTotalNumberOfRows: false) 5 5 0 2.0 507.7 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
evicting 0 rows (maxTimestampToEvictInMillis: -1) from 10000 rows: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------
-In-memory 0 0 0 23.2 43.2 1.0X
-RocksDB (trackTotalNumberOfRows: true) 4 4 0 2.6 387.5 0.1X
-RocksDB (trackTotalNumberOfRows: false) 4 4 0 2.6 389.4 0.1X
+In-memory 0 0 0 22.6 44.3 1.0X
+RocksDB (trackTotalNumberOfRows: true) 4 4 0 2.8 360.5 0.1X
+RocksDB (trackTotalNumberOfRows: false) 4 4 0 2.8 360.8 0.1X
diff --git a/sql/core/benchmarks/StringFunctionsBenchmark-jdk21-results.txt b/sql/core/benchmarks/StringFunctionsBenchmark-jdk21-results.txt
index c1684fae10653..caff1265db41e 100644
--- a/sql/core/benchmarks/StringFunctionsBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/StringFunctionsBenchmark-jdk21-results.txt
@@ -2,10 +2,10 @@
SQL string functions
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
regexp_replace: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-regexp_replace('*-*', '(\\d+)', 'num') 500 515 11 2.0 499.9 1.0X
+regexp_replace('*-*', '(\\d+)', 'num') 491 512 24 2.0 491.4 1.0X
diff --git a/sql/core/benchmarks/StringFunctionsBenchmark-results.txt b/sql/core/benchmarks/StringFunctionsBenchmark-results.txt
index a6571007f7aac..ae35dc90be5e3 100644
--- a/sql/core/benchmarks/StringFunctionsBenchmark-results.txt
+++ b/sql/core/benchmarks/StringFunctionsBenchmark-results.txt
@@ -2,10 +2,10 @@
SQL string functions
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
regexp_replace: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-regexp_replace('*-*', '(\\d+)', 'num') 500 514 13 2.0 499.7 1.0X
+regexp_replace('*-*', '(\\d+)', 'num') 536 552 14 1.9 536.2 1.0X
diff --git a/sql/core/benchmarks/SubExprEliminationBenchmark-jdk21-results.txt b/sql/core/benchmarks/SubExprEliminationBenchmark-jdk21-results.txt
index 8cf0ba7224bad..ba1109cab5578 100644
--- a/sql/core/benchmarks/SubExprEliminationBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/SubExprEliminationBenchmark-jdk21-results.txt
@@ -3,23 +3,23 @@ Benchmark for performance of subexpression elimination
================================================================================================
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1021-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_json as subExpr in Project: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-subExprElimination false, codegen: true 6700 7047 301 0.0 67001649.1 1.0X
-subExprElimination false, codegen: false 6719 6837 118 0.0 67191470.6 1.0X
-subExprElimination true, codegen: true 1350 1489 122 0.0 13503842.8 5.0X
-subExprElimination true, codegen: false 1366 1444 96 0.0 13658823.9 4.9X
+subExprElimination false, codegen: true 6356 6511 154 0.0 63562019.6 1.0X
+subExprElimination false, codegen: false 6308 6384 66 0.0 63084255.4 1.0X
+subExprElimination true, codegen: true 1210 1265 93 0.0 12099184.7 5.3X
+subExprElimination true, codegen: false 1236 1299 99 0.0 12360076.2 5.1X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1021-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_json as subExpr in Filter: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-subExprElimination false, codegen: true 7250 7520 384 0.0 72501549.6 1.0X
-subExprElimination false, codegen: false 7255 7366 114 0.0 72554716.3 1.0X
-subExprElimination true, codegen: true 1934 2024 79 0.0 19344228.2 3.7X
-subExprElimination true, codegen: false 1981 2015 29 0.0 19814306.4 3.7X
+subExprElimination false, codegen: true 6485 6649 174 0.0 64852199.5 1.0X
+subExprElimination false, codegen: false 6390 6489 87 0.0 63895276.1 1.0X
+subExprElimination true, codegen: true 1580 1633 52 0.0 15799544.7 4.1X
+subExprElimination true, codegen: false 1619 1649 27 0.0 16193983.0 4.0X
diff --git a/sql/core/benchmarks/SubExprEliminationBenchmark-results.txt b/sql/core/benchmarks/SubExprEliminationBenchmark-results.txt
index b689fef720f78..2a0da13bab2ec 100644
--- a/sql/core/benchmarks/SubExprEliminationBenchmark-results.txt
+++ b/sql/core/benchmarks/SubExprEliminationBenchmark-results.txt
@@ -3,23 +3,23 @@ Benchmark for performance of subexpression elimination
================================================================================================
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1021-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_json as subExpr in Project: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-subExprElimination false, codegen: true 6389 6498 173 0.0 63887225.6 1.0X
-subExprElimination false, codegen: false 6235 6292 81 0.0 62351284.2 1.0X
-subExprElimination true, codegen: true 1328 1368 47 0.0 13284825.9 4.8X
-subExprElimination true, codegen: false 1323 1368 73 0.0 13227629.0 4.8X
+subExprElimination false, codegen: true 6643 6703 53 0.0 66433286.4 1.0X
+subExprElimination false, codegen: false 6408 6436 26 0.0 64082328.5 1.0X
+subExprElimination true, codegen: true 1545 1596 44 0.0 15454792.9 4.3X
+subExprElimination true, codegen: false 1459 1548 79 0.0 14592926.1 4.6X
Preparing data for benchmarking ...
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1021-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
from_json as subExpr in Filter: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-subExprElimination false, codegen: true 7081 7177 86 0.0 70813603.9 1.0X
-subExprElimination false, codegen: false 6586 6720 139 0.0 65859888.8 1.1X
-subExprElimination true, codegen: true 1729 1827 117 0.0 17291697.7 4.1X
-subExprElimination true, codegen: false 1726 1789 57 0.0 17255779.7 4.1X
+subExprElimination false, codegen: true 6726 6789 69 0.0 67259727.5 1.0X
+subExprElimination false, codegen: false 6800 6851 77 0.0 68003862.4 1.0X
+subExprElimination true, codegen: true 1833 1906 74 0.0 18325029.8 3.7X
+subExprElimination true, codegen: false 1834 1901 64 0.0 18341410.4 3.7X
diff --git a/sql/core/benchmarks/TPCDSQueryBenchmark-jdk21-results.txt b/sql/core/benchmarks/TPCDSQueryBenchmark-jdk21-results.txt
index c92e2b6d44980..808031f4085cb 100644
--- a/sql/core/benchmarks/TPCDSQueryBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/TPCDSQueryBenchmark-jdk21-results.txt
@@ -1,810 +1,810 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q1 646 812 151 0.7 1400.6 1.0X
+q1 702 806 129 0.7 1521.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q2 889 901 21 2.5 398.3 1.0X
+q2 882 961 72 2.5 395.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q3 230 279 41 12.9 77.5 1.0X
+q3 241 276 33 12.3 81.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q4 5117 5164 67 1.0 981.8 1.0X
+q4 4969 5281 442 1.0 953.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q5 1140 1339 282 4.9 202.5 1.0X
+q5 1126 1294 239 5.0 200.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q6 1125 1137 17 2.8 360.4 1.0X
+q6 1103 1185 115 2.8 353.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q7 604 636 33 8.1 123.4 1.0X
+q7 591 630 45 8.3 120.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q8 489 517 32 6.3 157.5 1.0X
+q8 435 509 93 7.1 140.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q9 900 925 23 0.0 25708761.0 1.0X
+q9 878 926 41 0.0 25082543.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q10 1997 2109 159 1.0 964.3 1.0X
+q10 2047 2064 24 1.0 988.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q11 1857 2054 279 2.0 492.4 1.0X
+q11 1758 2001 343 2.1 466.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q12 163 199 39 5.0 201.1 1.0X
+q12 173 203 31 4.7 213.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q13 817 855 39 6.0 165.7 1.0X
+q13 775 821 61 6.4 157.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14a 5011 5171 226 1.0 976.8 1.0X
+q14a 4554 4759 290 1.1 887.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14b 4082 4106 34 1.3 795.7 1.0X
+q14b 3718 3760 60 1.4 724.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q15 391 410 34 4.3 235.2 1.0X
+q15 404 431 41 4.1 242.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q16 595 666 49 2.6 380.5 1.0X
+q16 606 653 59 2.6 387.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q17 1243 1338 133 3.8 264.6 1.0X
+q17 1341 1361 29 3.5 285.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q18 1051 1247 277 3.4 291.8 1.0X
+q18 1128 1281 216 3.2 313.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q19 303 321 21 10.3 97.1 1.0X
+q19 305 328 28 10.2 97.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q20 183 207 32 8.4 119.6 1.0X
+q20 186 208 49 8.2 121.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q21 660 683 39 17.9 55.7 1.0X
+q21 667 693 39 17.7 56.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q22 3373 3418 64 3.5 285.0 1.0X
+q22 3318 3393 106 3.6 280.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q23a 5880 6049 239 0.9 1124.3 1.0X
+q23a 5982 6138 220 0.9 1143.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q23b 5821 5955 189 0.9 1113.1 1.0X
+q23b 6036 6134 139 0.9 1154.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q24a 212 266 43 15.7 63.7 1.0X
+q24a 221 255 44 15.1 66.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q24b 223 261 48 15.0 66.7 1.0X
+q24b 215 245 23 15.5 64.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q25 1315 1343 40 3.6 279.8 1.0X
+q25 1279 1346 95 3.7 272.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q26 357 386 36 9.7 103.3 1.0X
+q26 348 381 32 9.9 100.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q27 577 611 27 8.5 117.9 1.0X
+q27 574 611 42 8.5 117.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q28 1373 1414 57 2.1 476.8 1.0X
+q28 1319 1411 130 2.2 458.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q29 1235 1300 93 3.8 262.7 1.0X
+q29 1311 1368 80 3.6 279.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q30 390 438 38 0.8 1323.4 1.0X
+q30 410 435 28 0.7 1390.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q31 811 1114 429 4.6 217.9 1.0X
+q31 805 920 186 4.6 216.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q32 221 234 9 6.9 144.7 1.0X
+q32 206 242 59 7.4 134.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q33 429 467 39 12.1 82.8 1.0X
+q33 386 419 38 13.4 74.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q34 371 407 25 8.3 121.2 1.0X
+q34 359 391 36 8.5 117.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q35 1252 1302 71 1.7 604.6 1.0X
+q35 1234 1281 66 1.7 596.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q36 533 560 41 5.6 179.4 1.0X
+q36 529 565 40 5.6 178.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q37 798 827 26 16.6 60.1 1.0X
+q37 841 875 35 15.8 63.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q38 641 711 65 8.1 123.1 1.0X
+q38 657 703 62 7.9 126.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q39a 1349 1486 193 8.8 114.0 1.0X
+q39a 1502 1556 77 7.9 126.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q39b 1360 1447 123 8.7 114.9 1.0X
+q39b 1406 1428 32 8.4 118.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q40 309 401 71 5.4 184.6 1.0X
+q40 318 349 35 5.3 190.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q41 137 158 27 0.1 7598.4 1.0X
+q41 137 157 19 0.1 7635.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q42 149 161 17 19.9 50.1 1.0X
+q42 150 172 30 19.8 50.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q43 316 347 34 9.3 107.2 1.0X
+q43 314 339 31 9.4 106.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q44 351 381 29 8.3 121.1 1.0X
+q44 341 369 28 8.5 117.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q45 211 231 15 4.5 220.1 1.0X
+q45 186 218 34 5.2 194.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q46 482 503 25 6.5 154.9 1.0X
+q46 458 493 37 6.8 147.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q47 1486 1605 168 2.0 500.1 1.0X
+q47 1658 1673 22 1.8 557.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q48 943 947 4 5.2 191.6 1.0X
+q48 878 919 42 5.6 178.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q49 585 670 127 9.6 104.1 1.0X
+q49 537 587 34 10.5 95.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q50 641 693 50 5.1 197.8 1.0X
+q50 627 686 62 5.2 193.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q51 2650 2698 68 1.4 721.7 1.0X
+q51 2585 2765 254 1.4 704.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q52 150 182 27 19.8 50.6 1.0X
+q52 152 165 18 19.5 51.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q53 282 322 37 10.5 94.9 1.0X
+q53 278 308 28 10.7 93.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q54 1220 1248 40 4.3 231.0 1.0X
+q54 1205 1236 44 4.4 228.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q55 146 160 19 20.3 49.2 1.0X
+q55 151 166 20 19.7 50.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q56 402 447 43 12.9 77.7 1.0X
+q56 386 433 55 13.4 74.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q57 759 820 71 2.0 495.7 1.0X
+q57 743 840 107 2.1 485.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q58 403 428 30 12.7 78.6 1.0X
+q58 462 522 108 11.1 90.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q59 702 715 14 4.2 237.6 1.0X
+q59 671 689 23 4.4 227.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q60 422 468 46 12.3 81.6 1.0X
+q60 401 416 15 12.9 77.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q61 537 571 35 5.8 172.2 1.0X
+q61 523 575 85 6.0 167.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q62 180 194 21 4.4 227.4 1.0X
+q62 180 203 28 4.4 227.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q63 276 296 22 10.8 92.9 1.0X
+q63 283 302 32 10.5 95.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q64 2183 2459 391 3.2 315.4 1.0X
+q64 2215 2452 336 3.1 320.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q65 594 646 66 5.0 200.0 1.0X
+q65 598 637 41 5.0 201.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q66 515 612 121 4.5 222.2 1.0X
+q66 464 503 46 5.0 200.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q67 5498 5512 19 0.5 1850.8 1.0X
+q67 5499 5604 149 0.5 1850.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q68 469 509 36 6.6 150.9 1.0X
+q68 430 476 44 7.2 138.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q69 1706 1714 11 1.2 824.0 1.0X
+q69 1662 1673 15 1.2 802.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q70 566 598 42 5.2 191.8 1.0X
+q70 586 612 41 5.0 198.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q71 374 408 30 14.0 71.7 1.0X
+q71 361 382 35 14.5 69.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q72 106812 113451 9389 0.1 6959.4 1.0X
+q72 119812 123190 4778 0.1 7806.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q73 349 371 36 8.8 113.9 1.0X
+q73 332 360 35 9.2 108.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q74 1195 1502 434 3.2 316.9 1.0X
+q74 1242 1393 214 3.0 329.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q75 1487 1666 252 3.8 264.0 1.0X
+q75 1269 1615 489 4.4 225.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q76 295 316 21 17.4 57.5 1.0X
+q76 291 321 26 17.6 56.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q77 538 719 163 10.4 95.7 1.0X
+q77 643 792 142 8.7 114.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q78 1963 2055 129 2.9 349.6 1.0X
+q78 2160 2354 275 2.6 384.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q79 418 451 26 7.3 136.7 1.0X
+q79 418 444 27 7.3 136.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q80 1551 1845 416 3.6 274.7 1.0X
+q80 1333 1458 177 4.2 236.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q81 339 390 39 1.1 924.9 1.0X
+q81 277 387 80 1.3 756.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q82 1101 1102 1 13.4 74.8 1.0X
+q82 1074 1103 41 13.7 73.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q83 244 283 39 2.4 409.7 1.0X
+q83 239 283 36 2.5 402.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q84 615 671 48 3.8 259.9 1.0X
+q84 646 686 53 3.7 273.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q85 1636 1926 410 1.7 577.2 1.0X
+q85 1638 1768 185 1.7 577.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q86 187 208 22 4.3 231.1 1.0X
+q86 185 205 20 4.4 228.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q87 652 719 81 8.0 125.0 1.0X
+q87 669 752 73 7.8 128.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q88 1207 1396 268 2.5 405.9 1.0X
+q88 1259 1351 131 2.4 423.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q89 317 365 43 9.4 106.8 1.0X
+q89 317 347 43 9.4 106.7 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q90 113 139 20 7.2 138.5 1.0X
+q90 117 139 22 6.9 144.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q91 335 381 45 6.9 145.8 1.0X
+q91 323 368 55 7.1 140.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q92 134 153 23 6.0 165.8 1.0X
+q92 135 158 21 6.0 166.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q93 402 441 42 7.9 126.9 1.0X
+q93 450 533 91 7.0 142.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q94 313 353 45 2.7 371.3 1.0X
+q94 331 360 31 2.5 393.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q95 5220 5267 66 0.2 6199.7 1.0X
+q95 5243 5383 197 0.2 6227.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q96 165 183 23 18.1 55.4 1.0X
+q96 172 187 20 17.2 58.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q97 1090 1139 70 4.0 248.2 1.0X
+q97 1177 1190 19 3.7 267.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q98 254 288 29 11.7 85.5 1.0X
+q98 276 296 30 10.8 92.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q99 267 288 24 5.7 176.7 1.0X
+q99 269 292 32 5.6 178.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q5a-v2.7 1315 1472 221 4.3 233.7 1.0X
+q5a-v2.7 1159 1215 80 4.9 206.0 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q6-v2.7 892 954 62 3.5 285.7 1.0X
+q6-v2.7 959 1002 60 3.3 307.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q10a-v2.7 1836 1927 129 1.1 886.5 1.0X
+q10a-v2.7 1899 1941 59 1.1 917.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q11-v2.7 1673 1998 460 2.3 443.5 1.0X
+q11-v2.7 1529 1934 573 2.5 405.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q12-v2.7 126 143 22 6.4 155.7 1.0X
+q12-v2.7 131 149 22 6.2 161.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14-v2.7 3412 3660 351 1.5 665.1 1.0X
+q14-v2.7 3360 3619 366 1.5 655.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14a-v2.7 7118 7330 301 0.7 1387.6 1.0X
+q14a-v2.7 7535 7653 167 0.7 1468.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q18a-v2.7 1954 2086 188 1.8 542.4 1.0X
+q18a-v2.7 2009 2283 388 1.8 557.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q20-v2.7 161 190 47 9.5 105.2 1.0X
+q20-v2.7 165 174 11 9.3 107.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q22-v2.7 13538 13568 42 0.9 1143.8 1.0X
+q22-v2.7 13296 13422 178 0.9 1123.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q22a-v2.7 1993 2057 90 5.9 168.4 1.0X
+q22a-v2.7 1956 2080 176 6.1 165.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q24-v2.7 202 233 25 16.5 60.6 1.0X
+q24-v2.7 197 225 27 16.9 59.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q27a-v2.7 1219 1552 470 4.0 249.2 1.0X
+q27a-v2.7 1351 1699 492 3.6 276.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q34-v2.7 347 377 28 8.8 113.4 1.0X
+q34-v2.7 344 378 50 8.9 112.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q35-v2.7 1211 1240 42 1.7 584.7 1.0X
+q35-v2.7 1196 1249 76 1.7 577.5 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q35a-v2.7 1225 1263 54 1.7 591.7 1.0X
+q35a-v2.7 1166 1223 82 1.8 562.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q36a-v2.7 492 525 38 6.0 165.7 1.0X
+q36a-v2.7 494 511 20 6.0 166.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q47-v2.7 1560 1705 205 1.9 525.2 1.0X
+q47-v2.7 1632 1657 36 1.8 549.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q49-v2.7 541 624 81 10.4 96.3 1.0X
+q49-v2.7 503 538 55 11.2 89.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q51a-v2.7 15126 15337 298 0.2 4119.6 1.0X
+q51a-v2.7 14959 15258 423 0.2 4074.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q57-v2.7 747 823 67 2.1 487.6 1.0X
+q57-v2.7 759 816 78 2.0 495.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q64-v2.7 2071 2354 400 3.3 299.3 1.0X
+q64-v2.7 2234 2554 453 3.1 322.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q67a-v2.7 6815 7072 363 0.4 2294.0 1.0X
+q67a-v2.7 7609 7799 270 0.4 2561.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q70a-v2.7 619 636 13 4.8 209.8 1.0X
+q70a-v2.7 626 674 57 4.7 212.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q72-v2.7 101776 104972 4519 0.2 6631.3 1.0X
+q72-v2.7 123476 124060 826 0.1 8045.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q74-v2.7 1219 1398 254 3.1 323.1 1.0X
+q74-v2.7 1378 1388 15 2.7 365.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q75-v2.7 1236 1484 351 4.6 219.5 1.0X
+q75-v2.7 1303 1621 450 4.3 231.3 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q77a-v2.7 780 895 156 7.2 138.9 1.0X
+q77a-v2.7 699 810 96 8.0 124.6 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q78-v2.7 1939 2304 516 2.9 345.2 1.0X
+q78-v2.7 2490 2537 67 2.3 443.4 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q80a-v2.7 1689 1700 14 3.3 299.3 1.0X
+q80a-v2.7 1751 1915 231 3.2 310.2 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q86a-v2.7 227 267 36 3.6 280.2 1.0X
+q86a-v2.7 236 267 36 3.4 291.8 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q98-v2.7 255 283 37 11.6 85.9 1.0X
+q98-v2.7 270 294 25 11.0 90.8 1.0X
diff --git a/sql/core/benchmarks/TPCDSQueryBenchmark-results.txt b/sql/core/benchmarks/TPCDSQueryBenchmark-results.txt
index 1a4205ac535ae..aa67c8b71436b 100644
--- a/sql/core/benchmarks/TPCDSQueryBenchmark-results.txt
+++ b/sql/core/benchmarks/TPCDSQueryBenchmark-results.txt
@@ -1,810 +1,810 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q1 597 789 167 0.8 1294.9 1.0X
+q1 663 797 219 0.7 1437.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q2 800 887 76 2.8 358.5 1.0X
+q2 1027 1149 173 2.2 459.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q3 221 251 23 13.5 74.3 1.0X
+q3 245 280 23 12.1 82.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q4 4538 4797 367 1.1 870.7 1.0X
+q4 4521 4868 491 1.2 867.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q5 1210 1277 96 4.7 214.9 1.0X
+q5 1156 1372 306 4.9 205.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q6 1030 1052 31 3.0 330.1 1.0X
+q6 1128 1152 34 2.8 361.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q7 584 603 18 8.4 119.3 1.0X
+q7 706 753 70 6.9 144.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q8 455 490 33 6.8 146.5 1.0X
+q8 649 667 22 4.8 209.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q9 829 878 48 0.0 23682965.2 1.0X
+q9 976 1039 89 0.0 27895478.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q10 1969 2095 178 1.1 950.8 1.0X
+q10 1940 2072 187 1.1 936.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q11 1966 2226 367 1.9 521.3 1.0X
+q11 2074 2322 350 1.8 549.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q12 218 263 34 3.7 268.7 1.0X
+q12 218 267 26 3.7 268.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q13 854 892 42 5.8 173.1 1.0X
+q13 864 928 64 5.7 175.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14a 5110 5424 444 1.0 996.1 1.0X
+q14a 4917 5335 592 1.0 958.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14b 3621 3785 232 1.4 706.0 1.0X
+q14b 3663 3816 216 1.4 714.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q15 390 411 32 4.3 234.6 1.0X
+q15 415 439 26 4.0 249.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q16 709 748 48 2.2 453.5 1.0X
+q16 721 776 60 2.2 461.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q17 1340 1515 247 3.5 285.2 1.0X
+q17 1598 1735 194 2.9 340.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q18 1295 1421 178 2.8 359.6 1.0X
+q18 1385 1390 7 2.6 384.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q19 370 402 35 8.4 118.7 1.0X
+q19 381 401 20 8.2 122.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q20 223 254 35 6.9 145.9 1.0X
+q20 200 237 44 7.7 130.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q21 687 695 14 17.2 58.0 1.0X
+q21 724 743 17 16.4 61.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q22 3422 3542 171 3.5 289.1 1.0X
+q22 3529 3631 144 3.4 298.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q23a 5917 6315 563 0.9 1131.5 1.0X
+q23a 6128 6160 46 0.9 1171.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q23b 5882 5930 67 0.9 1124.8 1.0X
+q23b 5923 5963 56 0.9 1132.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q24a 232 295 61 14.4 69.6 1.0X
+q24a 273 320 46 12.2 81.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q24b 146 239 48 22.8 43.9 1.0X
+q24b 209 253 38 16.0 62.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q25 1270 1289 27 3.7 270.4 1.0X
+q25 1281 1291 15 3.7 272.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q26 390 419 26 8.8 113.1 1.0X
+q26 405 420 18 8.5 117.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q27 599 619 17 8.2 122.5 1.0X
+q27 592 614 25 8.3 121.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q28 1437 1530 131 2.0 499.1 1.0X
+q28 1481 1542 87 1.9 514.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q29 1438 1566 181 3.3 306.0 1.0X
+q29 1446 1547 142 3.2 307.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q30 471 514 36 0.6 1597.0 1.0X
+q30 450 521 62 0.7 1526.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q31 1152 1411 366 3.2 309.6 1.0X
+q31 1369 1443 104 2.7 367.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q32 238 273 49 6.4 155.5 1.0X
+q32 250 288 31 6.1 163.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q33 498 552 55 10.4 96.2 1.0X
+q33 463 547 138 11.2 89.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q34 436 465 39 7.0 142.6 1.0X
+q34 423 443 12 7.2 138.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q35 1494 1500 8 1.4 721.7 1.0X
+q35 1375 1418 62 1.5 663.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q36 590 599 14 5.0 198.5 1.0X
+q36 571 586 15 5.2 192.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q37 883 920 33 15.0 66.5 1.0X
+q37 906 912 6 14.6 68.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q38 953 1211 365 5.5 182.8 1.0X
+q38 812 1068 362 6.4 155.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q39a 1453 1643 269 8.1 122.7 1.0X
+q39a 1516 1733 307 7.8 128.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q39b 1440 1540 142 8.2 121.6 1.0X
+q39b 1564 1683 168 7.6 132.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q40 325 352 22 5.2 193.8 1.0X
+q40 343 357 17 4.9 204.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q41 152 185 27 0.1 8439.8 1.0X
+q41 154 179 18 0.1 8582.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q42 164 207 39 18.1 55.3 1.0X
+q42 172 193 24 17.3 57.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q43 354 369 14 8.4 119.8 1.0X
+q43 345 359 14 8.6 116.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q44 336 347 8 8.6 116.0 1.0X
+q44 340 373 31 8.5 117.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q45 190 226 39 5.1 197.9 1.0X
+q45 214 253 20 4.5 222.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q46 489 522 23 6.4 157.1 1.0X
+q46 517 560 49 6.0 166.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q47 1612 1816 288 1.8 542.6 1.0X
+q47 1564 1607 62 1.9 526.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q48 913 935 22 5.4 185.5 1.0X
+q48 813 873 56 6.1 165.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q49 715 829 190 7.8 127.4 1.0X
+q49 533 571 36 10.5 95.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q50 715 734 17 4.5 220.6 1.0X
+q50 755 763 9 4.3 232.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q51 2685 2797 158 1.4 731.3 1.0X
+q51 2352 2471 167 1.6 640.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q52 158 182 21 18.8 53.3 1.0X
+q52 151 158 8 19.7 50.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q53 298 338 38 10.0 100.4 1.0X
+q53 280 287 8 10.6 94.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q54 1280 1337 81 4.1 242.4 1.0X
+q54 1157 1204 68 4.6 219.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q55 166 189 25 17.9 55.7 1.0X
+q55 148 158 4 20.1 49.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q56 490 561 98 10.6 94.6 1.0X
+q56 473 529 54 11.0 91.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q57 770 882 166 2.0 502.8 1.0X
+q57 905 1198 414 1.7 591.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q58 415 440 29 12.3 81.0 1.0X
+q58 514 535 25 10.0 100.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q59 643 675 42 4.6 217.8 1.0X
+q59 652 688 31 4.5 220.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q60 574 594 33 9.0 110.9 1.0X
+q60 412 419 6 12.6 79.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q61 569 598 47 5.5 182.1 1.0X
+q61 628 686 52 5.0 201.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q62 181 187 7 4.4 228.0 1.0X
+q62 168 180 12 4.7 211.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q63 296 345 37 10.0 99.5 1.0X
+q63 279 293 18 10.7 93.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q64 2546 2784 338 2.7 367.8 1.0X
+q64 2533 2795 371 2.7 365.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q65 804 822 20 3.7 270.6 1.0X
+q65 727 730 4 4.1 244.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q66 611 660 75 3.8 263.7 1.0X
+q66 516 562 68 4.5 222.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q67 5472 5599 180 0.5 1841.9 1.0X
+q67 5325 5412 123 0.6 1792.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q68 526 545 16 5.9 169.1 1.0X
+q68 508 545 48 6.1 163.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q69 1772 1813 58 1.2 855.8 1.0X
+q69 1734 1799 92 1.2 837.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q70 668 679 10 4.4 226.3 1.0X
+q70 671 678 8 4.4 227.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q71 412 431 17 12.7 79.0 1.0X
+q71 426 440 16 12.2 81.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q72 118708 121669 4188 0.1 7734.4 1.0X
+q72 108371 110305 2735 0.1 7061.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q73 410 432 19 7.5 134.0 1.0X
+q73 393 400 9 7.8 128.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q74 1615 1807 271 2.3 428.2 1.0X
+q74 1490 1742 357 2.5 394.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q75 1702 1934 328 3.3 302.1 1.0X
+q75 1696 1895 282 3.3 301.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q76 344 361 16 14.9 67.1 1.0X
+q76 329 346 15 15.6 64.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q77 1025 1076 71 5.5 182.6 1.0X
+q77 581 742 222 9.7 103.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q78 2602 2762 226 2.2 463.4 1.0X
+q78 2032 2334 427 2.8 361.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q79 460 468 6 6.6 150.5 1.0X
+q79 408 416 5 7.5 133.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q80 1722 1769 66 3.3 305.0 1.0X
+q80 1592 1598 9 3.5 281.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q81 412 456 47 0.9 1124.0 1.0X
+q81 379 431 61 1.0 1034.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q82 1181 1197 24 12.5 80.2 1.0X
+q82 1185 1185 0 12.4 80.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q83 316 336 17 1.9 531.0 1.0X
+q83 305 343 31 2.0 512.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q84 776 780 6 3.1 327.7 1.0X
+q84 777 796 28 3.0 328.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q85 2164 2318 218 1.3 763.4 1.0X
+q85 1792 2035 343 1.6 632.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q86 217 242 19 3.7 267.9 1.0X
+q86 211 234 17 3.8 260.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q87 802 850 48 6.5 153.9 1.0X
+q87 949 1160 298 5.5 182.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q88 1373 1670 420 2.2 461.6 1.0X
+q88 1194 1352 223 2.5 401.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q89 364 421 51 8.2 122.5 1.0X
+q89 352 427 66 8.4 118.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q90 138 163 20 5.9 170.2 1.0X
+q90 121 132 9 6.7 148.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q91 350 395 41 6.6 152.3 1.0X
+q91 320 356 44 7.2 139.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q92 138 160 20 5.9 170.1 1.0X
+q92 130 149 14 6.2 160.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q93 493 522 22 6.4 155.6 1.0X
+q93 451 494 51 7.0 142.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q94 384 410 33 2.2 456.3 1.0X
+q94 354 382 26 2.4 420.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q95 5272 5368 134 0.2 6261.8 1.0X
+q95 5246 5366 169 0.2 6230.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q96 184 211 28 16.2 61.7 1.0X
+q96 180 200 18 16.5 60.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q97 1291 1397 149 3.4 294.0 1.0X
+q97 1207 1268 86 3.6 274.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q98 323 345 22 9.2 108.8 1.0X
+q98 278 301 32 10.7 93.5 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q99 315 329 14 4.8 208.1 1.0X
+q99 275 302 17 5.5 182.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q5a-v2.7 1597 1683 121 3.5 283.8 1.0X
+q5a-v2.7 1579 1853 387 3.6 280.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q6-v2.7 1047 1108 86 3.0 335.6 1.0X
+q6-v2.7 1003 1003 0 3.1 321.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q10a-v2.7 1788 1920 186 1.2 863.6 1.0X
+q10a-v2.7 1797 1879 116 1.2 867.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q11-v2.7 1888 2202 443 2.0 500.7 1.0X
+q11-v2.7 1834 2280 630 2.1 486.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q12-v2.7 141 161 17 5.8 173.7 1.0X
+q12-v2.7 157 184 20 5.2 193.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14-v2.7 3971 4128 222 1.3 774.1 1.0X
+q14-v2.7 3900 4113 302 1.3 760.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q14a-v2.7 7072 7411 480 0.7 1378.5 1.0X
+q14a-v2.7 8068 8102 48 0.6 1572.9 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q18a-v2.7 1893 2189 419 1.9 525.6 1.0X
+q18a-v2.7 1755 2323 803 2.1 487.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q20-v2.7 159 178 14 9.6 104.1 1.0X
+q20-v2.7 162 173 6 9.4 106.1 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q22-v2.7 14036 14248 299 0.8 1185.9 1.0X
+q22-v2.7 14196 14538 483 0.8 1199.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q22a-v2.7 2096 2192 137 5.6 177.1 1.0X
+q22a-v2.7 2107 2195 124 5.6 178.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q24-v2.7 252 272 16 13.3 75.4 1.0X
+q24-v2.7 203 233 18 16.4 60.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q27a-v2.7 1357 1569 299 3.6 277.4 1.0X
+q27a-v2.7 1275 1711 617 3.8 260.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q34-v2.7 405 425 24 7.6 132.3 1.0X
+q34-v2.7 350 370 19 8.7 114.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q35-v2.7 1343 1424 115 1.5 648.5 1.0X
+q35-v2.7 1276 1323 66 1.6 616.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q35a-v2.7 1343 1429 122 1.5 648.4 1.0X
+q35a-v2.7 1234 1348 161 1.7 595.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q36a-v2.7 542 570 30 5.5 182.3 1.0X
+q36a-v2.7 557 588 26 5.3 187.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q47-v2.7 1533 1731 279 1.9 516.1 1.0X
+q47-v2.7 1756 1929 244 1.7 591.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q49-v2.7 627 644 31 9.0 111.6 1.0X
+q49-v2.7 573 646 95 9.8 102.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q51a-v2.7 14685 14924 338 0.3 3999.5 1.0X
+q51a-v2.7 14343 14818 673 0.3 3906.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q57-v2.7 786 837 44 1.9 513.5 1.0X
+q57-v2.7 803 861 99 1.9 524.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q64-v2.7 2399 2642 343 2.9 346.6 1.0X
+q64-v2.7 2618 3021 571 2.6 378.2 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q67a-v2.7 7749 7811 87 0.4 2608.4 1.0X
+q67a-v2.7 7111 7314 287 0.4 2393.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q70a-v2.7 696 704 8 4.2 235.8 1.0X
+q70a-v2.7 739 750 13 4.0 250.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q72-v2.7 97059 97107 67 0.2 6323.9 1.0X
+q72-v2.7 115607 117956 3321 0.1 7532.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q74-v2.7 1404 1675 383 2.7 372.2 1.0X
+q74-v2.7 1551 1714 230 2.4 411.3 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q75-v2.7 1434 1878 628 3.9 254.6 1.0X
+q75-v2.7 1705 1883 252 3.3 302.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q77a-v2.7 816 1004 283 6.9 145.2 1.0X
+q77a-v2.7 1262 1277 21 4.5 224.7 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q78-v2.7 2024 2365 482 2.8 360.5 1.0X
+q78-v2.7 2239 2684 630 2.5 398.8 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q80a-v2.7 1822 1984 230 3.1 322.6 1.0X
+q80a-v2.7 2166 2242 108 2.6 383.6 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q86a-v2.7 268 296 20 3.0 331.4 1.0X
+q86a-v2.7 285 311 19 2.8 352.0 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TPCDS: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-q98-v2.7 291 312 19 10.2 98.1 1.0X
+q98-v2.7 288 333 40 10.3 97.1 1.0X
diff --git a/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-jdk21-results.txt b/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-jdk21-results.txt
index 01299cee6fb90..6e3e10b804e81 100644
--- a/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-jdk21-results.txt
@@ -2,11 +2,11 @@
TakeOrderedAndProject
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TakeOrderedAndProject with SMJ: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-TakeOrderedAndProject with SMJ for doExecute 173 201 30 0.1 17333.6 1.0X
-TakeOrderedAndProject with SMJ for executeCollect 112 117 5 0.1 11175.1 1.6X
+TakeOrderedAndProject with SMJ for doExecute 188 208 18 0.1 18765.1 1.0X
+TakeOrderedAndProject with SMJ for executeCollect 95 104 12 0.1 9544.5 2.0X
diff --git a/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-results.txt b/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-results.txt
index efc97286cf50c..a641d73a1e043 100644
--- a/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-results.txt
+++ b/sql/core/benchmarks/TakeOrderedAndProjectBenchmark-results.txt
@@ -2,11 +2,11 @@
TakeOrderedAndProject
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
TakeOrderedAndProject with SMJ: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-TakeOrderedAndProject with SMJ for doExecute 206 212 5 0.0 20631.3 1.0X
-TakeOrderedAndProject with SMJ for executeCollect 111 121 10 0.1 11106.3 1.9X
+TakeOrderedAndProject with SMJ for doExecute 215 216 1 0.0 21490.5 1.0X
+TakeOrderedAndProject with SMJ for executeCollect 105 110 4 0.1 10469.7 2.1X
diff --git a/sql/core/benchmarks/TopKBenchmark-jdk21-results.txt b/sql/core/benchmarks/TopKBenchmark-jdk21-results.txt
index e5c669c53da3d..c15157e9d2362 100644
--- a/sql/core/benchmarks/TopKBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/TopKBenchmark-jdk21-results.txt
@@ -2,21 +2,21 @@
Top-K Computation
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Benchmark Top-K: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------
-ROW_NUMBER (PARTITION: , WindowGroupLimit: false) 8967 9181 174 2.3 427.6 1.0X
-ROW_NUMBER (PARTITION: , WindowGroupLimit: true) 1868 1909 23 11.2 89.1 4.8X
-ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11459 11734 120 1.8 546.4 0.8X
-ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4913 5018 51 4.3 234.3 1.8X
-RANK (PARTITION: , WindowGroupLimit: false) 9519 9767 113 2.2 453.9 0.9X
-RANK (PARTITION: , WindowGroupLimit: true) 1785 1855 48 11.8 85.1 5.0X
-RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 12177 12421 96 1.7 580.7 0.7X
-RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4907 5011 56 4.3 234.0 1.8X
-DENSE_RANK (PARTITION: , WindowGroupLimit: false) 9496 9681 150 2.2 452.8 0.9X
-DENSE_RANK (PARTITION: , WindowGroupLimit: true) 1756 1788 32 11.9 83.7 5.1X
-DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 12084 12385 158 1.7 576.2 0.7X
-DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4905 5035 69 4.3 233.9 1.8X
+ROW_NUMBER (PARTITION: , WindowGroupLimit: false) 8842 8986 82 2.4 421.6 1.0X
+ROW_NUMBER (PARTITION: , WindowGroupLimit: true) 1947 1970 12 10.8 92.8 4.5X
+ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11322 11472 78 1.9 539.9 0.8X
+ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4914 5102 88 4.3 234.3 1.8X
+RANK (PARTITION: , WindowGroupLimit: false) 9422 9698 196 2.2 449.3 0.9X
+RANK (PARTITION: , WindowGroupLimit: true) 1720 1752 20 12.2 82.0 5.1X
+RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11841 11996 120 1.8 564.6 0.7X
+RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4790 4991 130 4.4 228.4 1.8X
+DENSE_RANK (PARTITION: , WindowGroupLimit: false) 9185 9356 136 2.3 438.0 1.0X
+DENSE_RANK (PARTITION: , WindowGroupLimit: true) 1756 1917 121 11.9 83.7 5.0X
+DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11572 11776 154 1.8 551.8 0.8X
+DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4749 4917 118 4.4 226.5 1.9X
diff --git a/sql/core/benchmarks/TopKBenchmark-results.txt b/sql/core/benchmarks/TopKBenchmark-results.txt
index b07a395f9e9ca..3e71741956878 100644
--- a/sql/core/benchmarks/TopKBenchmark-results.txt
+++ b/sql/core/benchmarks/TopKBenchmark-results.txt
@@ -2,21 +2,21 @@
Top-K Computation
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Benchmark Top-K: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------
-ROW_NUMBER (PARTITION: , WindowGroupLimit: false) 9240 9454 213 2.3 440.6 1.0X
-ROW_NUMBER (PARTITION: , WindowGroupLimit: true) 1612 1633 18 13.0 76.8 5.7X
-ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11354 11429 50 1.8 541.4 0.8X
-ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: true) 5117 5204 83 4.1 244.0 1.8X
-RANK (PARTITION: , WindowGroupLimit: false) 9589 9766 239 2.2 457.2 1.0X
-RANK (PARTITION: , WindowGroupLimit: true) 1848 1867 17 11.3 88.1 5.0X
-RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11752 11930 211 1.8 560.4 0.8X
-RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 5197 5255 32 4.0 247.8 1.8X
-DENSE_RANK (PARTITION: , WindowGroupLimit: false) 9604 9645 50 2.2 457.9 1.0X
-DENSE_RANK (PARTITION: , WindowGroupLimit: true) 1843 1883 39 11.4 87.9 5.0X
-DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11681 11993 569 1.8 557.0 0.8X
-DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 5098 5191 72 4.1 243.1 1.8X
+ROW_NUMBER (PARTITION: , WindowGroupLimit: false) 8866 8994 143 2.4 422.8 1.0X
+ROW_NUMBER (PARTITION: , WindowGroupLimit: true) 1612 1628 18 13.0 76.9 5.5X
+ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11230 11313 118 1.9 535.5 0.8X
+ROW_NUMBER (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4829 4961 94 4.3 230.3 1.8X
+RANK (PARTITION: , WindowGroupLimit: false) 9412 9445 36 2.2 448.8 0.9X
+RANK (PARTITION: , WindowGroupLimit: true) 1835 1976 51 11.4 87.5 4.8X
+RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11637 11818 148 1.8 554.9 0.8X
+RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 5005 5048 28 4.2 238.6 1.8X
+DENSE_RANK (PARTITION: , WindowGroupLimit: false) 9288 9331 36 2.3 442.9 1.0X
+DENSE_RANK (PARTITION: , WindowGroupLimit: true) 1808 1973 61 11.6 86.2 4.9X
+DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: false) 11553 11734 149 1.8 550.9 0.8X
+DENSE_RANK (PARTITION: PARTITION BY b, WindowGroupLimit: true) 4876 5021 81 4.3 232.5 1.8X
diff --git a/sql/core/benchmarks/UDFBenchmark-jdk21-results.txt b/sql/core/benchmarks/UDFBenchmark-jdk21-results.txt
index 8b0870813056c..f0cd4591f60c8 100644
--- a/sql/core/benchmarks/UDFBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/UDFBenchmark-jdk21-results.txt
@@ -2,58 +2,58 @@
UDF with mixed input types
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int/string to string: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-long/nullable int/string to string wholestage off 140 164 33 0.7 1402.0 1.0X
-long/nullable int/string to string wholestage on 65 72 8 1.5 650.3 2.2X
+long/nullable int/string to string wholestage off 102 117 20 1.0 1022.8 1.0X
+long/nullable int/string to string wholestage on 56 67 9 1.8 562.4 1.8X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int/string to option: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-long/nullable int/string to option wholestage off 56 62 8 1.8 557.2 1.0X
-long/nullable int/string to option wholestage on 39 44 4 2.6 386.4 1.4X
+long/nullable int/string to option wholestage off 41 41 1 2.5 406.0 1.0X
+long/nullable int/string to option wholestage on 38 44 5 2.6 381.5 1.1X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int/string to primitive: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-long/nullable int/string to primitive wholestage off 35 35 0 2.8 352.7 1.0X
-long/nullable int/string to primitive wholestage on 29 32 2 3.4 291.4 1.2X
+long/nullable int/string to primitive wholestage off 32 32 1 3.2 315.4 1.0X
+long/nullable int/string to primitive wholestage on 27 32 5 3.8 265.5 1.2X
================================================================================================
UDF with primitive types
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int to string: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-long/nullable int to string wholestage off 31 32 1 3.2 313.6 1.0X
-long/nullable int to string wholestage on 32 36 4 3.2 315.7 1.0X
+long/nullable int to string wholestage off 29 29 1 3.5 286.4 1.0X
+long/nullable int to string wholestage on 29 32 4 3.5 288.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int to option: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-long/nullable int to option wholestage off 23 24 2 4.4 226.0 1.0X
-long/nullable int to option wholestage on 26 32 6 3.9 258.2 0.9X
+long/nullable int to option wholestage off 21 24 4 4.7 213.9 1.0X
+long/nullable int to option wholestage on 21 23 3 4.8 208.1 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int to primitive: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-long/nullable int to primitive wholestage off 19 22 5 5.3 188.3 1.0X
-long/nullable int to primitive wholestage on 18 18 0 5.6 180.2 1.0X
+long/nullable int to primitive wholestage off 17 23 9 6.1 165.1 1.0X
+long/nullable int to primitive wholestage on 17 22 4 5.8 172.9 1.0X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
UDF identity overhead: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Baseline 12 14 2 8.2 122.4 1.0X
-With identity UDF 16 18 2 6.4 157.2 0.8X
+Baseline 12 14 1 8.4 118.8 1.0X
+With identity UDF 14 15 1 7.2 139.5 0.9X
diff --git a/sql/core/benchmarks/UDFBenchmark-results.txt b/sql/core/benchmarks/UDFBenchmark-results.txt
index ca92c3305295f..746babff4bf4f 100644
--- a/sql/core/benchmarks/UDFBenchmark-results.txt
+++ b/sql/core/benchmarks/UDFBenchmark-results.txt
@@ -2,58 +2,58 @@
UDF with mixed input types
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int/string to string: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-long/nullable int/string to string wholestage off 118 129 16 0.8 1182.2 1.0X
-long/nullable int/string to string wholestage on 70 88 12 1.4 704.4 1.7X
+long/nullable int/string to string wholestage off 124 149 34 0.8 1243.3 1.0X
+long/nullable int/string to string wholestage on 67 81 9 1.5 667.5 1.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int/string to option: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------------
-long/nullable int/string to option wholestage off 53 55 3 1.9 531.1 1.0X
-long/nullable int/string to option wholestage on 39 43 4 2.5 392.5 1.4X
+long/nullable int/string to option wholestage off 43 50 9 2.3 431.5 1.0X
+long/nullable int/string to option wholestage on 38 42 3 2.6 378.6 1.1X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int/string to primitive: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------
-long/nullable int/string to primitive wholestage off 30 32 3 3.4 298.1 1.0X
-long/nullable int/string to primitive wholestage on 30 34 4 3.3 303.9 1.0X
+long/nullable int/string to primitive wholestage off 30 31 1 3.3 304.0 1.0X
+long/nullable int/string to primitive wholestage on 31 37 5 3.2 308.7 1.0X
================================================================================================
UDF with primitive types
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int to string: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-long/nullable int to string wholestage off 36 41 8 2.8 355.3 1.0X
-long/nullable int to string wholestage on 31 32 2 3.3 305.2 1.2X
+long/nullable int to string wholestage off 31 31 1 3.3 306.2 1.0X
+long/nullable int to string wholestage on 30 33 2 3.3 303.4 1.0X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int to option: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------
-long/nullable int to option wholestage off 31 32 1 3.2 314.5 1.0X
-long/nullable int to option wholestage on 22 24 2 4.5 220.3 1.4X
+long/nullable int to option wholestage off 32 32 0 3.1 320.4 1.0X
+long/nullable int to option wholestage on 21 25 5 4.7 213.7 1.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
long/nullable int to primitive: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------
-long/nullable int to primitive wholestage off 18 19 1 5.4 183.9 1.0X
-long/nullable int to primitive wholestage on 19 20 0 5.2 193.8 0.9X
+long/nullable int to primitive wholestage off 20 22 2 4.9 202.8 1.0X
+long/nullable int to primitive wholestage on 17 18 1 5.8 172.3 1.2X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
UDF identity overhead: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Baseline 12 13 1 8.3 120.0 1.0X
-With identity UDF 16 25 5 6.1 164.7 0.7X
+Baseline 11 13 3 9.1 109.9 1.0X
+With identity UDF 16 17 1 6.1 164.9 0.7X
diff --git a/sql/core/benchmarks/UnsafeArrayDataBenchmark-jdk21-results.txt b/sql/core/benchmarks/UnsafeArrayDataBenchmark-jdk21-results.txt
index 5f447a39039fa..4b93de5445f14 100644
--- a/sql/core/benchmarks/UnsafeArrayDataBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/UnsafeArrayDataBenchmark-jdk21-results.txt
@@ -2,32 +2,32 @@
Benchmark UnsafeArrayData
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read UnsafeArrayData: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 80 80 1 2091.7 0.5 1.0X
+Int 80 80 0 2094.8 0.5 1.0X
Double 159 159 0 1056.0 0.9 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write UnsafeArrayData: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 12 16 2 1699.1 0.6 1.0X
-Double 28 34 4 738.0 1.4 0.4X
+Int 14 16 3 1545.3 0.6 1.0X
+Double 29 33 3 721.4 1.4 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Get primitive array from UnsafeArrayData: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 19 21 1 3255.6 0.3 1.0X
-Double 40 43 2 1572.0 0.6 0.5X
+Int 20 22 1 3202.8 0.3 1.0X
+Double 41 45 2 1522.6 0.7 0.5X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Create UnsafeArrayData from primitive array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Int 20 22 1 3206.7 0.3 1.0X
-Double 42 46 2 1496.8 0.7 0.5X
+Int 21 24 1 2937.5 0.3 1.0X
+Double 45 47 2 1411.0 0.7 0.5X
diff --git a/sql/core/benchmarks/UnsafeArrayDataBenchmark-results.txt b/sql/core/benchmarks/UnsafeArrayDataBenchmark-results.txt
index 3ddb3bdb3f0b4..689931d9b4aa1 100644
--- a/sql/core/benchmarks/UnsafeArrayDataBenchmark-results.txt
+++ b/sql/core/benchmarks/UnsafeArrayDataBenchmark-results.txt
@@ -2,32 +2,32 @@
Benchmark UnsafeArrayData
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Read UnsafeArrayData: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 76 77 1 2200.4 0.5 1.0X
-Double 158 159 0 1059.1 0.9 0.5X
+Int 76 76 0 2204.0 0.5 1.0X
+Double 159 159 0 1055.2 0.9 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Write UnsafeArrayData: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 12 13 1 1777.3 0.6 1.0X
-Double 28 33 4 754.2 1.3 0.4X
+Int 14 15 1 1501.6 0.7 1.0X
+Double 32 38 3 647.1 1.5 0.4X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Get primitive array from UnsafeArrayData: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-Int 19 22 2 3276.8 0.3 1.0X
-Double 41 43 2 1546.7 0.6 0.5X
+Int 21 24 1 2956.5 0.3 1.0X
+Double 45 48 1 1390.6 0.7 0.5X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Create UnsafeArrayData from primitive array: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
---------------------------------------------------------------------------------------------------------------------------
-Int 20 23 1 3189.4 0.3 1.0X
-Double 45 47 2 1400.8 0.7 0.4X
+Int 22 25 1 2802.3 0.4 1.0X
+Double 46 49 1 1357.5 0.7 0.5X
diff --git a/sql/core/benchmarks/UpdateFieldsBenchmark-jdk21-results.txt b/sql/core/benchmarks/UpdateFieldsBenchmark-jdk21-results.txt
index fdda101722dfc..1f33913b1038d 100644
--- a/sql/core/benchmarks/UpdateFieldsBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/UpdateFieldsBenchmark-jdk21-results.txt
@@ -2,25 +2,25 @@
Add 2 columns and drop 2 columns at 3 different depths of nesting
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Add 2 columns and drop 2 columns at 3 different depths of nesting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------
To non-nullable StructTypes using performant method 2 3 1 0.0 Infinity 1.0X
-To nullable StructTypes using performant method 1 1 0 0.0 Infinity 1.4X
-To non-nullable StructTypes using non-performant method 25 27 4 0.0 Infinity 0.1X
-To nullable StructTypes using non-performant method 563 618 41 0.0 Infinity 0.0X
+To nullable StructTypes using performant method 1 2 1 0.0 Infinity 1.4X
+To non-nullable StructTypes using non-performant method 33 36 4 0.0 Infinity 0.1X
+To nullable StructTypes using non-performant method 723 738 18 0.0 Infinity 0.0X
================================================================================================
Add 50 columns and drop 50 columns at 100 different depths of nesting
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Add 50 columns and drop 50 columns at 100 different depths of nesting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-To non-nullable StructTypes using performant method 426 430 6 0.0 Infinity 1.0X
-To nullable StructTypes using performant method 455 471 20 0.0 Infinity 0.9X
+To non-nullable StructTypes using performant method 714 731 20 0.0 Infinity 1.0X
+To nullable StructTypes using performant method 731 762 28 0.0 Infinity 1.0X
diff --git a/sql/core/benchmarks/UpdateFieldsBenchmark-results.txt b/sql/core/benchmarks/UpdateFieldsBenchmark-results.txt
index e6f50a6b410fa..f716aef1f4d52 100644
--- a/sql/core/benchmarks/UpdateFieldsBenchmark-results.txt
+++ b/sql/core/benchmarks/UpdateFieldsBenchmark-results.txt
@@ -2,25 +2,25 @@
Add 2 columns and drop 2 columns at 3 different depths of nesting
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Add 2 columns and drop 2 columns at 3 different depths of nesting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------
To non-nullable StructTypes using performant method 2 3 1 0.0 Infinity 1.0X
-To nullable StructTypes using performant method 1 2 0 0.0 Infinity 1.4X
-To non-nullable StructTypes using non-performant method 27 28 2 0.0 Infinity 0.1X
-To nullable StructTypes using non-performant method 632 671 41 0.0 Infinity 0.0X
+To nullable StructTypes using performant method 2 2 0 0.0 Infinity 1.3X
+To non-nullable StructTypes using non-performant method 43 45 3 0.0 Infinity 0.0X
+To nullable StructTypes using non-performant method 762 789 23 0.0 Infinity 0.0X
================================================================================================
Add 50 columns and drop 50 columns at 100 different depths of nesting
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
Add 50 columns and drop 50 columns at 100 different depths of nesting: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-----------------------------------------------------------------------------------------------------------------------------------------------------
-To non-nullable StructTypes using performant method 523 528 4 0.0 Infinity 1.0X
-To nullable StructTypes using performant method 558 560 1 0.0 Infinity 0.9X
+To non-nullable StructTypes using performant method 1058 1061 5 0.0 Infinity 1.0X
+To nullable StructTypes using performant method 1055 1061 8 0.0 Infinity 1.0X
diff --git a/sql/core/benchmarks/V2FunctionBenchmark-jdk21-results.txt b/sql/core/benchmarks/V2FunctionBenchmark-jdk21-results.txt
index 5057d398891b0..dc84a0f3a54a6 100644
--- a/sql/core/benchmarks/V2FunctionBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/V2FunctionBenchmark-jdk21-results.txt
@@ -1,44 +1,44 @@
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = true codegen = true: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 10089 10493 661 49.6 20.2 1.0X
-java_long_add_default 22867 22890 37 21.9 45.7 0.4X
-java_long_add_magic 11600 11644 57 43.1 23.2 0.9X
-java_long_add_static_magic 11562 11720 228 43.2 23.1 0.9X
-scala_long_add_default 23965 24147 265 20.9 47.9 0.4X
-scala_long_add_magic 11591 11820 356 43.1 23.2 0.9X
+native_long_add 9835 10320 826 50.8 19.7 1.0X
+java_long_add_default 21945 22529 922 22.8 43.9 0.4X
+java_long_add_magic 11566 11633 112 43.2 23.1 0.9X
+java_long_add_static_magic 11509 11536 25 43.4 23.0 0.9X
+scala_long_add_default 23210 23294 133 21.5 46.4 0.4X
+scala_long_add_magic 11543 11601 99 43.3 23.1 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = false codegen = true: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 10907 11657 732 45.8 21.8 1.0X
-java_long_add_default 22513 22805 495 22.2 45.0 0.5X
-java_long_add_magic 12082 12151 67 41.4 24.2 0.9X
-java_long_add_static_magic 10022 10193 174 49.9 20.0 1.1X
-scala_long_add_default 22328 22403 83 22.4 44.7 0.5X
-scala_long_add_magic 11624 11873 229 43.0 23.2 0.9X
+native_long_add 10152 10364 183 49.3 20.3 1.0X
+java_long_add_default 22197 22314 193 22.5 44.4 0.5X
+java_long_add_magic 11567 11620 60 43.2 23.1 0.9X
+java_long_add_static_magic 9994 10035 37 50.0 20.0 1.0X
+scala_long_add_default 22078 22110 30 22.6 44.2 0.5X
+scala_long_add_magic 11575 11702 130 43.2 23.1 0.9X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = true codegen = false: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 22932 23181 407 21.8 45.9 1.0X
-java_long_add_default 26925 27143 353 18.6 53.8 0.9X
-java_long_add_magic 32820 32934 125 15.2 65.6 0.7X
-java_long_add_static_magic 30895 31058 156 16.2 61.8 0.7X
-scala_long_add_default 26669 26864 237 18.7 53.3 0.9X
-scala_long_add_magic 32976 33334 407 15.2 66.0 0.7X
+native_long_add 22677 22692 18 22.0 45.4 1.0X
+java_long_add_default 26749 26801 52 18.7 53.5 0.8X
+java_long_add_magic 32489 32582 100 15.4 65.0 0.7X
+java_long_add_static_magic 30791 30824 37 16.2 61.6 0.7X
+scala_long_add_default 26460 26510 44 18.9 52.9 0.9X
+scala_long_add_magic 32668 32724 50 15.3 65.3 0.7X
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = false codegen = false: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 21803 21918 134 22.9 43.6 1.0X
-java_long_add_default 25534 25962 715 19.6 51.1 0.9X
-java_long_add_magic 32086 32180 123 15.6 64.2 0.7X
-java_long_add_static_magic 29945 30086 149 16.7 59.9 0.7X
-scala_long_add_default 25475 25523 42 19.6 51.0 0.9X
-scala_long_add_magic 32125 32175 44 15.6 64.3 0.7X
+native_long_add 22890 23100 291 21.8 45.8 1.0X
+java_long_add_default 26587 26639 45 18.8 53.2 0.9X
+java_long_add_magic 32885 32954 65 15.2 65.8 0.7X
+java_long_add_static_magic 31021 31268 224 16.1 62.0 0.7X
+scala_long_add_default 26612 26893 261 18.8 53.2 0.9X
+scala_long_add_magic 33112 33351 339 15.1 66.2 0.7X
diff --git a/sql/core/benchmarks/V2FunctionBenchmark-results.txt b/sql/core/benchmarks/V2FunctionBenchmark-results.txt
index 81726a34bcbba..966b8434ddb08 100644
--- a/sql/core/benchmarks/V2FunctionBenchmark-results.txt
+++ b/sql/core/benchmarks/V2FunctionBenchmark-results.txt
@@ -1,44 +1,44 @@
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = true codegen = true: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 9267 9290 37 54.0 18.5 1.0X
-java_long_add_default 22321 22462 232 22.4 44.6 0.4X
-java_long_add_magic 10925 10945 18 45.8 21.8 0.8X
-java_long_add_static_magic 11068 11192 142 45.2 22.1 0.8X
-scala_long_add_default 22271 22289 16 22.5 44.5 0.4X
-scala_long_add_magic 10930 10998 66 45.7 21.9 0.8X
+native_long_add 9191 9247 50 54.4 18.4 1.0X
+java_long_add_default 22939 23001 57 21.8 45.9 0.4X
+java_long_add_magic 10694 10751 81 46.8 21.4 0.9X
+java_long_add_static_magic 10567 11615 998 47.3 21.1 0.9X
+scala_long_add_default 23064 23144 104 21.7 46.1 0.4X
+scala_long_add_magic 10726 10797 62 46.6 21.5 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = false codegen = true: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 9944 10134 286 50.3 19.9 1.0X
-java_long_add_default 21517 21538 19 23.2 43.0 0.5X
-java_long_add_magic 11487 11535 59 43.5 23.0 0.9X
-java_long_add_static_magic 10276 10343 64 48.7 20.6 1.0X
-scala_long_add_default 21555 21610 51 23.2 43.1 0.5X
-scala_long_add_magic 11027 11154 187 45.3 22.1 0.9X
+native_long_add 10042 10098 93 49.8 20.1 1.0X
+java_long_add_default 22278 22326 64 22.4 44.6 0.5X
+java_long_add_magic 10647 10660 13 47.0 21.3 0.9X
+java_long_add_static_magic 9944 10014 88 50.3 19.9 1.0X
+scala_long_add_default 22176 22516 586 22.5 44.4 0.5X
+scala_long_add_magic 10690 10745 79 46.8 21.4 0.9X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = true codegen = false: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 22916 23049 122 21.8 45.8 1.0X
-java_long_add_default 28358 28408 80 17.6 56.7 0.8X
-java_long_add_magic 31588 31709 134 15.8 63.2 0.7X
-java_long_add_static_magic 31198 31452 337 16.0 62.4 0.7X
-scala_long_add_default 26362 26390 36 19.0 52.7 0.9X
-scala_long_add_magic 31958 32000 37 15.6 63.9 0.7X
+native_long_add 22784 22953 185 21.9 45.6 1.0X
+java_long_add_default 26064 26088 38 19.2 52.1 0.9X
+java_long_add_magic 32566 32610 76 15.4 65.1 0.7X
+java_long_add_static_magic 32014 32099 81 15.6 64.0 0.7X
+scala_long_add_default 27099 27195 92 18.5 54.2 0.8X
+scala_long_add_magic 32697 33739 915 15.3 65.4 0.7X
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
scalar function (long + long) -> long, result_nullable = false codegen = false: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
--------------------------------------------------------------------------------------------------------------------------------------------------------------
-native_long_add 22121 22162 68 22.6 44.2 1.0X
-java_long_add_default 25925 26037 98 19.3 51.8 0.9X
-java_long_add_magic 31642 31668 24 15.8 63.3 0.7X
-java_long_add_static_magic 30902 30948 55 16.2 61.8 0.7X
-scala_long_add_default 25906 25930 25 19.3 51.8 0.9X
-scala_long_add_magic 31693 32012 374 15.8 63.4 0.7X
+native_long_add 21805 21817 10 22.9 43.6 1.0X
+java_long_add_default 25863 26093 239 19.3 51.7 0.8X
+java_long_add_magic 31630 31668 55 15.8 63.3 0.7X
+java_long_add_static_magic 31125 31300 263 16.1 62.3 0.7X
+scala_long_add_default 25823 26135 463 19.4 51.6 0.8X
+scala_long_add_magic 31689 31881 330 15.8 63.4 0.7X
diff --git a/sql/core/benchmarks/WideSchemaBenchmark-jdk21-results.txt b/sql/core/benchmarks/WideSchemaBenchmark-jdk21-results.txt
index 534aa70e59af2..9963575f763ff 100644
--- a/sql/core/benchmarks/WideSchemaBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/WideSchemaBenchmark-jdk21-results.txt
@@ -2,157 +2,157 @@
parsing large select expressions
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
parsing large select: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 select expressions 1 1 0 0.0 671823.0 1.0X
-100 select expressions 3 3 0 0.0 3220274.0 0.2X
-2500 select expressions 70 72 2 0.0 69682180.0 0.0X
+1 select expressions 1 1 0 0.0 632990.0 1.0X
+100 select expressions 3 3 0 0.0 2850444.0 0.2X
+2500 select expressions 63 65 3 0.0 62915152.0 0.0X
================================================================================================
optimize large select expressions
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
optimize large select: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-100 columns 3 4 1 0.0 2961331.0 1.0X
-1000 columns 16 18 3 0.0 15853499.0 0.2X
-10000 columns 150 170 14 0.0 150229609.0 0.0X
+100 columns 3 4 1 0.0 2952203.0 1.0X
+1000 columns 17 18 1 0.0 17106048.0 0.2X
+10000 columns 162 177 18 0.0 162356332.0 0.0X
================================================================================================
many column field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
many column field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 cols x 100000 rows (read in-mem) 14 21 4 6.9 144.2 1.0X
-1 cols x 100000 rows (exec in-mem) 15 18 4 6.9 145.6 1.0X
-1 cols x 100000 rows (read parquet) 27 37 10 3.7 272.7 0.5X
-1 cols x 100000 rows (write parquet) 88 97 11 1.1 878.8 0.2X
-100 cols x 1000 rows (read in-mem) 11 15 4 9.0 111.2 1.3X
-100 cols x 1000 rows (exec in-mem) 13 18 5 7.4 134.6 1.1X
-100 cols x 1000 rows (read parquet) 23 28 8 4.4 228.8 0.6X
-100 cols x 1000 rows (write parquet) 85 92 11 1.2 845.1 0.2X
-2500 cols x 40 rows (read in-mem) 44 51 10 2.3 435.1 0.3X
-2500 cols x 40 rows (exec in-mem) 69 85 21 1.4 692.4 0.2X
-2500 cols x 40 rows (read parquet) 263 268 6 0.4 2627.9 0.1X
-2500 cols x 40 rows (write parquet) 119 136 17 0.8 1193.7 0.1X
+1 cols x 100000 rows (read in-mem) 17 23 5 5.9 168.2 1.0X
+1 cols x 100000 rows (exec in-mem) 16 21 4 6.3 159.8 1.1X
+1 cols x 100000 rows (read parquet) 29 36 6 3.4 293.5 0.6X
+1 cols x 100000 rows (write parquet) 92 97 6 1.1 915.5 0.2X
+100 cols x 1000 rows (read in-mem) 13 17 4 8.0 125.5 1.3X
+100 cols x 1000 rows (exec in-mem) 15 18 4 6.7 149.0 1.1X
+100 cols x 1000 rows (read parquet) 24 29 6 4.1 244.8 0.7X
+100 cols x 1000 rows (write parquet) 87 95 8 1.1 870.1 0.2X
+2500 cols x 40 rows (read in-mem) 47 49 4 2.1 472.7 0.4X
+2500 cols x 40 rows (exec in-mem) 74 79 9 1.3 741.1 0.2X
+2500 cols x 40 rows (read parquet) 316 326 7 0.3 3160.6 0.1X
+2500 cols x 40 rows (write parquet) 122 131 9 0.8 1220.3 0.1X
================================================================================================
wide shallowly nested struct field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
wide shallowly nested struct field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 wide x 100000 rows (read in-mem) 20 24 6 5.0 198.2 1.0X
-1 wide x 100000 rows (exec in-mem) 21 26 6 4.7 213.3 0.9X
-1 wide x 100000 rows (read parquet) 22 26 6 4.6 217.9 0.9X
-1 wide x 100000 rows (write parquet) 94 102 11 1.1 944.8 0.2X
-100 wide x 1000 rows (read in-mem) 15 19 6 6.6 150.9 1.3X
-100 wide x 1000 rows (exec in-mem) 16 18 4 6.4 157.4 1.3X
-100 wide x 1000 rows (read parquet) 22 25 5 4.6 215.3 0.9X
-100 wide x 1000 rows (write parquet) 89 103 11 1.1 889.6 0.2X
-2500 wide x 40 rows (read in-mem) 21 23 4 4.9 205.9 1.0X
-2500 wide x 40 rows (exec in-mem) 22 25 5 4.5 219.9 0.9X
-2500 wide x 40 rows (read parquet) 65 69 6 1.5 647.1 0.3X
-2500 wide x 40 rows (write parquet) 94 110 7 1.1 944.7 0.2X
+1 wide x 100000 rows (read in-mem) 21 28 7 4.8 208.2 1.0X
+1 wide x 100000 rows (exec in-mem) 22 27 5 4.5 224.1 0.9X
+1 wide x 100000 rows (read parquet) 23 29 8 4.3 230.1 0.9X
+1 wide x 100000 rows (write parquet) 96 104 8 1.0 962.3 0.2X
+100 wide x 1000 rows (read in-mem) 16 20 6 6.4 157.3 1.3X
+100 wide x 1000 rows (exec in-mem) 17 21 6 6.0 166.2 1.3X
+100 wide x 1000 rows (read parquet) 22 26 5 4.5 223.2 0.9X
+100 wide x 1000 rows (write parquet) 90 99 12 1.1 896.8 0.2X
+2500 wide x 40 rows (read in-mem) 21 24 5 4.8 209.2 1.0X
+2500 wide x 40 rows (exec in-mem) 22 27 6 4.5 223.7 0.9X
+2500 wide x 40 rows (read parquet) 65 70 6 1.5 654.5 0.3X
+2500 wide x 40 rows (write parquet) 96 102 9 1.0 957.8 0.2X
================================================================================================
deeply nested struct field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
deeply nested struct field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 deep x 100000 rows (read in-mem) 16 19 5 6.4 155.5 1.0X
-1 deep x 100000 rows (exec in-mem) 18 21 5 5.6 177.4 0.9X
-1 deep x 100000 rows (read parquet) 18 21 5 5.5 182.1 0.9X
-1 deep x 100000 rows (write parquet) 90 94 3 1.1 899.4 0.2X
-100 deep x 1000 rows (read in-mem) 45 47 3 2.2 448.2 0.3X
-100 deep x 1000 rows (exec in-mem) 455 463 6 0.2 4548.0 0.0X
-100 deep x 1000 rows (read parquet) 462 471 6 0.2 4618.6 0.0X
-100 deep x 1000 rows (write parquet) 127 137 6 0.8 1271.2 0.1X
-250 deep x 400 rows (read in-mem) 194 197 2 0.5 1940.9 0.1X
-250 deep x 400 rows (exec in-mem) 2758 2764 9 0.0 27576.6 0.0X
-250 deep x 400 rows (read parquet) 2752 2754 2 0.0 27523.9 0.0X
-250 deep x 400 rows (write parquet) 268 274 5 0.4 2676.3 0.1X
+1 deep x 100000 rows (read in-mem) 16 21 6 6.2 160.4 1.0X
+1 deep x 100000 rows (exec in-mem) 18 23 6 5.5 183.0 0.9X
+1 deep x 100000 rows (read parquet) 18 22 5 5.4 184.9 0.9X
+1 deep x 100000 rows (write parquet) 90 98 7 1.1 902.9 0.2X
+100 deep x 1000 rows (read in-mem) 44 47 4 2.3 440.2 0.4X
+100 deep x 1000 rows (exec in-mem) 469 475 7 0.2 4690.1 0.0X
+100 deep x 1000 rows (read parquet) 476 478 2 0.2 4761.2 0.0X
+100 deep x 1000 rows (write parquet) 119 124 4 0.8 1191.8 0.1X
+250 deep x 400 rows (read in-mem) 192 196 4 0.5 1918.4 0.1X
+250 deep x 400 rows (exec in-mem) 2876 2879 5 0.0 28758.0 0.0X
+250 deep x 400 rows (read parquet) 2853 2856 4 0.0 28534.9 0.0X
+250 deep x 400 rows (write parquet) 265 274 7 0.4 2651.7 0.1X
================================================================================================
bushy struct field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
bushy struct field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-1 x 1 deep x 100000 rows (read in-mem) 13 15 4 7.6 131.1 1.0X
-1 x 1 deep x 100000 rows (exec in-mem) 15 17 4 6.6 151.7 0.9X
-1 x 1 deep x 100000 rows (read parquet) 18 20 5 5.7 175.1 0.7X
-1 x 1 deep x 100000 rows (write parquet) 87 91 4 1.1 873.2 0.2X
-128 x 8 deep x 1000 rows (read in-mem) 14 16 4 7.4 135.3 1.0X
-128 x 8 deep x 1000 rows (exec in-mem) 15 17 4 6.8 146.2 0.9X
-128 x 8 deep x 1000 rows (read parquet) 21 23 5 4.8 208.9 0.6X
-128 x 8 deep x 1000 rows (write parquet) 87 94 7 1.2 868.4 0.2X
-1024 x 11 deep x 100 rows (read in-mem) 16 19 4 6.1 164.9 0.8X
-1024 x 11 deep x 100 rows (exec in-mem) 18 20 4 5.6 180.1 0.7X
-1024 x 11 deep x 100 rows (read parquet) 34 38 5 2.9 342.1 0.4X
-1024 x 11 deep x 100 rows (write parquet) 91 101 9 1.1 906.6 0.1X
+1 x 1 deep x 100000 rows (read in-mem) 14 16 4 7.3 137.7 1.0X
+1 x 1 deep x 100000 rows (exec in-mem) 15 18 4 6.5 153.5 0.9X
+1 x 1 deep x 100000 rows (read parquet) 18 20 5 5.5 180.9 0.8X
+1 x 1 deep x 100000 rows (write parquet) 89 94 8 1.1 887.7 0.2X
+128 x 8 deep x 1000 rows (read in-mem) 13 16 5 7.5 134.0 1.0X
+128 x 8 deep x 1000 rows (exec in-mem) 15 17 4 6.8 146.1 0.9X
+128 x 8 deep x 1000 rows (read parquet) 21 25 5 4.7 212.1 0.6X
+128 x 8 deep x 1000 rows (write parquet) 87 92 7 1.1 873.3 0.2X
+1024 x 11 deep x 100 rows (read in-mem) 17 20 5 5.8 172.0 0.8X
+1024 x 11 deep x 100 rows (exec in-mem) 19 24 6 5.4 186.9 0.7X
+1024 x 11 deep x 100 rows (read parquet) 35 39 6 2.9 349.6 0.4X
+1024 x 11 deep x 100 rows (write parquet) 91 97 7 1.1 909.3 0.2X
================================================================================================
wide array field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
wide array field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 wide x 100000 rows (read in-mem) 15 17 4 6.7 150.3 1.0X
-1 wide x 100000 rows (exec in-mem) 17 20 4 5.8 172.0 0.9X
-1 wide x 100000 rows (read parquet) 18 20 4 5.6 177.3 0.8X
-1 wide x 100000 rows (write parquet) 89 97 7 1.1 889.4 0.2X
-100 wide x 1000 rows (read in-mem) 11 13 4 8.9 112.0 1.3X
-100 wide x 1000 rows (exec in-mem) 13 15 4 7.8 128.7 1.2X
-100 wide x 1000 rows (read parquet) 17 20 5 5.8 173.5 0.9X
-100 wide x 1000 rows (write parquet) 85 95 7 1.2 850.1 0.2X
-2500 wide x 40 rows (read in-mem) 11 13 4 9.2 109.1 1.4X
-2500 wide x 40 rows (exec in-mem) 12 15 4 8.0 124.8 1.2X
-2500 wide x 40 rows (read parquet) 17 19 4 5.9 170.3 0.9X
-2500 wide x 40 rows (write parquet) 84 89 4 1.2 844.3 0.2X
+1 wide x 100000 rows (read in-mem) 15 18 4 6.7 149.3 1.0X
+1 wide x 100000 rows (exec in-mem) 17 19 4 5.9 170.3 0.9X
+1 wide x 100000 rows (read parquet) 18 20 5 5.7 176.6 0.8X
+1 wide x 100000 rows (write parquet) 88 94 7 1.1 884.9 0.2X
+100 wide x 1000 rows (read in-mem) 11 14 4 8.8 113.4 1.3X
+100 wide x 1000 rows (exec in-mem) 13 16 4 7.7 129.4 1.2X
+100 wide x 1000 rows (read parquet) 17 20 6 5.8 173.6 0.9X
+100 wide x 1000 rows (write parquet) 85 90 7 1.2 847.2 0.2X
+2500 wide x 40 rows (read in-mem) 11 12 3 9.1 109.8 1.4X
+2500 wide x 40 rows (exec in-mem) 12 14 4 8.1 124.2 1.2X
+2500 wide x 40 rows (read parquet) 17 19 5 5.9 170.5 0.9X
+2500 wide x 40 rows (write parquet) 84 91 6 1.2 841.5 0.2X
================================================================================================
wide map field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
wide map field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 wide x 100000 rows (read in-mem) 12 14 2 8.0 124.5 1.0X
-1 wide x 100000 rows (exec in-mem) 16 19 3 6.1 164.2 0.8X
-1 wide x 100000 rows (read parquet) 21 24 5 4.7 213.1 0.6X
-1 wide x 100000 rows (write parquet) 86 92 6 1.2 855.4 0.1X
-100 wide x 1000 rows (read in-mem) 8 9 2 13.0 76.7 1.6X
-100 wide x 1000 rows (exec in-mem) 10 11 2 10.3 97.0 1.3X
-100 wide x 1000 rows (read parquet) 19 22 5 5.3 187.1 0.7X
-100 wide x 1000 rows (write parquet) 81 87 6 1.2 806.6 0.2X
-2500 wide x 40 rows (read in-mem) 10 11 3 10.5 95.7 1.3X
-2500 wide x 40 rows (exec in-mem) 11 13 3 8.8 113.7 1.1X
-2500 wide x 40 rows (read parquet) 19 21 5 5.4 186.2 0.7X
-2500 wide x 40 rows (write parquet) 83 89 6 1.2 826.0 0.2X
+1 wide x 100000 rows (read in-mem) 12 14 3 8.1 123.4 1.0X
+1 wide x 100000 rows (exec in-mem) 16 18 3 6.2 160.2 0.8X
+1 wide x 100000 rows (read parquet) 21 25 5 4.7 213.2 0.6X
+1 wide x 100000 rows (write parquet) 85 90 6 1.2 850.3 0.1X
+100 wide x 1000 rows (read in-mem) 7 9 3 13.6 73.6 1.7X
+100 wide x 1000 rows (exec in-mem) 9 11 3 10.6 94.0 1.3X
+100 wide x 1000 rows (read parquet) 18 22 6 5.4 184.6 0.7X
+100 wide x 1000 rows (write parquet) 80 84 5 1.2 802.4 0.2X
+2500 wide x 40 rows (read in-mem) 9 10 3 11.1 90.0 1.4X
+2500 wide x 40 rows (exec in-mem) 11 12 3 9.1 109.6 1.1X
+2500 wide x 40 rows (read parquet) 19 21 4 5.3 189.2 0.7X
+2500 wide x 40 rows (write parquet) 82 88 8 1.2 818.2 0.2X
diff --git a/sql/core/benchmarks/WideSchemaBenchmark-results.txt b/sql/core/benchmarks/WideSchemaBenchmark-results.txt
index fe8a25b6e918d..d2d2a4b9f084d 100644
--- a/sql/core/benchmarks/WideSchemaBenchmark-results.txt
+++ b/sql/core/benchmarks/WideSchemaBenchmark-results.txt
@@ -2,157 +2,157 @@
parsing large select expressions
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
parsing large select: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 select expressions 1 1 0 0.0 641958.0 1.0X
-100 select expressions 3 3 1 0.0 3194529.0 0.2X
-2500 select expressions 70 71 2 0.0 69525822.0 0.0X
+1 select expressions 1 1 0 0.0 650133.0 1.0X
+100 select expressions 3 3 0 0.0 3239833.0 0.2X
+2500 select expressions 71 73 2 0.0 70970829.0 0.0X
================================================================================================
optimize large select expressions
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
optimize large select: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-100 columns 3 4 1 0.0 2941387.0 1.0X
-1000 columns 16 18 3 0.0 16490130.0 0.2X
-10000 columns 152 165 17 0.0 151554960.0 0.0X
+100 columns 3 4 1 0.0 3227010.0 1.0X
+1000 columns 18 20 2 0.0 18320597.0 0.2X
+10000 columns 182 198 18 0.0 182328011.0 0.0X
================================================================================================
many column field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
many column field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 cols x 100000 rows (read in-mem) 19 28 7 5.4 186.4 1.0X
-1 cols x 100000 rows (exec in-mem) 16 25 6 6.1 162.9 1.1X
-1 cols x 100000 rows (read parquet) 33 48 8 3.1 325.9 0.6X
-1 cols x 100000 rows (write parquet) 93 119 13 1.1 932.5 0.2X
-100 cols x 1000 rows (read in-mem) 11 15 3 8.7 114.6 1.6X
-100 cols x 1000 rows (exec in-mem) 14 19 5 7.2 139.1 1.3X
-100 cols x 1000 rows (read parquet) 23 28 4 4.3 231.6 0.8X
-100 cols x 1000 rows (write parquet) 85 91 7 1.2 854.0 0.2X
-2500 cols x 40 rows (read in-mem) 44 47 4 2.3 442.7 0.4X
-2500 cols x 40 rows (exec in-mem) 71 76 5 1.4 710.2 0.3X
-2500 cols x 40 rows (read parquet) 260 264 3 0.4 2598.0 0.1X
-2500 cols x 40 rows (write parquet) 119 127 6 0.8 1193.2 0.2X
+1 cols x 100000 rows (read in-mem) 18 24 3 5.5 180.9 1.0X
+1 cols x 100000 rows (exec in-mem) 17 22 3 5.9 170.1 1.1X
+1 cols x 100000 rows (read parquet) 31 37 5 3.3 306.0 0.6X
+1 cols x 100000 rows (write parquet) 93 100 6 1.1 926.7 0.2X
+100 cols x 1000 rows (read in-mem) 13 17 3 7.4 134.3 1.3X
+100 cols x 1000 rows (exec in-mem) 16 19 3 6.3 160.0 1.1X
+100 cols x 1000 rows (read parquet) 25 30 5 3.9 253.6 0.7X
+100 cols x 1000 rows (write parquet) 88 94 6 1.1 884.9 0.2X
+2500 cols x 40 rows (read in-mem) 49 51 6 2.0 489.9 0.4X
+2500 cols x 40 rows (exec in-mem) 75 82 11 1.3 747.3 0.2X
+2500 cols x 40 rows (read parquet) 284 292 9 0.4 2843.7 0.1X
+2500 cols x 40 rows (write parquet) 125 135 8 0.8 1248.2 0.1X
================================================================================================
wide shallowly nested struct field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
wide shallowly nested struct field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 wide x 100000 rows (read in-mem) 20 26 5 5.0 199.2 1.0X
-1 wide x 100000 rows (exec in-mem) 21 28 6 4.7 214.2 0.9X
-1 wide x 100000 rows (read parquet) 22 29 6 4.5 220.0 0.9X
-1 wide x 100000 rows (write parquet) 94 102 8 1.1 944.6 0.2X
-100 wide x 1000 rows (read in-mem) 15 18 3 6.7 148.6 1.3X
-100 wide x 1000 rows (exec in-mem) 16 18 3 6.3 159.2 1.3X
-100 wide x 1000 rows (read parquet) 21 24 4 4.7 214.7 0.9X
-100 wide x 1000 rows (write parquet) 90 97 12 1.1 899.6 0.2X
-2500 wide x 40 rows (read in-mem) 21 22 3 4.9 206.0 1.0X
-2500 wide x 40 rows (exec in-mem) 22 24 3 4.6 217.2 0.9X
-2500 wide x 40 rows (read parquet) 65 70 4 1.5 652.8 0.3X
-2500 wide x 40 rows (write parquet) 96 101 6 1.0 960.8 0.2X
+1 wide x 100000 rows (read in-mem) 21 27 5 4.8 209.3 1.0X
+1 wide x 100000 rows (exec in-mem) 23 27 3 4.3 232.4 0.9X
+1 wide x 100000 rows (read parquet) 24 29 6 4.2 235.5 0.9X
+1 wide x 100000 rows (write parquet) 96 104 7 1.0 956.0 0.2X
+100 wide x 1000 rows (read in-mem) 16 19 3 6.3 159.5 1.3X
+100 wide x 1000 rows (exec in-mem) 17 20 3 5.9 169.9 1.2X
+100 wide x 1000 rows (read parquet) 22 25 3 4.5 224.4 0.9X
+100 wide x 1000 rows (write parquet) 89 95 5 1.1 894.0 0.2X
+2500 wide x 40 rows (read in-mem) 22 24 3 4.6 216.2 1.0X
+2500 wide x 40 rows (exec in-mem) 23 26 4 4.4 229.5 0.9X
+2500 wide x 40 rows (read parquet) 66 69 4 1.5 661.6 0.3X
+2500 wide x 40 rows (write parquet) 96 103 8 1.0 964.4 0.2X
================================================================================================
deeply nested struct field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
deeply nested struct field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 deep x 100000 rows (read in-mem) 15 17 2 6.5 153.7 1.0X
-1 deep x 100000 rows (exec in-mem) 17 20 3 5.8 172.2 0.9X
-1 deep x 100000 rows (read parquet) 18 20 3 5.5 183.1 0.8X
-1 deep x 100000 rows (write parquet) 90 97 5 1.1 901.8 0.2X
-100 deep x 1000 rows (read in-mem) 28 30 3 3.5 283.9 0.5X
-100 deep x 1000 rows (exec in-mem) 419 424 6 0.2 4192.5 0.0X
-100 deep x 1000 rows (read parquet) 430 439 7 0.2 4304.2 0.0X
-100 deep x 1000 rows (write parquet) 105 110 6 1.0 1045.3 0.1X
-250 deep x 400 rows (read in-mem) 106 111 6 0.9 1060.8 0.1X
-250 deep x 400 rows (exec in-mem) 2507 2517 14 0.0 25067.5 0.0X
-250 deep x 400 rows (read parquet) 2585 2589 5 0.0 25851.9 0.0X
-250 deep x 400 rows (write parquet) 180 186 7 0.6 1799.1 0.1X
+1 deep x 100000 rows (read in-mem) 16 19 4 6.1 163.9 1.0X
+1 deep x 100000 rows (exec in-mem) 18 22 4 5.5 182.9 0.9X
+1 deep x 100000 rows (read parquet) 19 22 4 5.4 185.2 0.9X
+1 deep x 100000 rows (write parquet) 89 95 7 1.1 889.2 0.2X
+100 deep x 1000 rows (read in-mem) 30 31 3 3.4 297.8 0.6X
+100 deep x 1000 rows (exec in-mem) 404 410 8 0.2 4042.1 0.0X
+100 deep x 1000 rows (read parquet) 418 434 23 0.2 4178.6 0.0X
+100 deep x 1000 rows (write parquet) 103 108 5 1.0 1025.2 0.2X
+250 deep x 400 rows (read in-mem) 105 110 5 1.0 1050.3 0.2X
+250 deep x 400 rows (exec in-mem) 2463 2480 23 0.0 24634.0 0.0X
+250 deep x 400 rows (read parquet) 2537 2539 2 0.0 25372.5 0.0X
+250 deep x 400 rows (write parquet) 177 182 4 0.6 1765.6 0.1X
================================================================================================
bushy struct field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
bushy struct field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
-------------------------------------------------------------------------------------------------------------------------
-1 x 1 deep x 100000 rows (read in-mem) 13 15 3 7.7 129.7 1.0X
-1 x 1 deep x 100000 rows (exec in-mem) 15 16 3 6.9 145.7 0.9X
-1 x 1 deep x 100000 rows (read parquet) 17 19 4 5.8 171.3 0.8X
-1 x 1 deep x 100000 rows (write parquet) 88 92 5 1.1 877.2 0.1X
-128 x 8 deep x 1000 rows (read in-mem) 13 14 2 7.9 126.5 1.0X
-128 x 8 deep x 1000 rows (exec in-mem) 14 15 2 7.1 140.8 0.9X
-128 x 8 deep x 1000 rows (read parquet) 20 23 3 5.0 201.6 0.6X
-128 x 8 deep x 1000 rows (write parquet) 87 96 9 1.1 870.6 0.1X
-1024 x 11 deep x 100 rows (read in-mem) 16 18 3 6.1 164.3 0.8X
-1024 x 11 deep x 100 rows (exec in-mem) 18 20 3 5.7 175.6 0.7X
-1024 x 11 deep x 100 rows (read parquet) 34 38 4 2.9 341.2 0.4X
-1024 x 11 deep x 100 rows (write parquet) 91 95 6 1.1 906.0 0.1X
+1 x 1 deep x 100000 rows (read in-mem) 14 16 4 7.2 138.9 1.0X
+1 x 1 deep x 100000 rows (exec in-mem) 16 18 3 6.4 156.5 0.9X
+1 x 1 deep x 100000 rows (read parquet) 18 20 3 5.5 181.8 0.8X
+1 x 1 deep x 100000 rows (write parquet) 87 92 5 1.1 874.0 0.2X
+128 x 8 deep x 1000 rows (read in-mem) 13 15 3 7.6 132.4 1.0X
+128 x 8 deep x 1000 rows (exec in-mem) 15 16 3 6.8 147.2 0.9X
+128 x 8 deep x 1000 rows (read parquet) 21 23 4 4.9 205.7 0.7X
+128 x 8 deep x 1000 rows (write parquet) 85 89 4 1.2 854.3 0.2X
+1024 x 11 deep x 100 rows (read in-mem) 18 20 3 5.7 176.0 0.8X
+1024 x 11 deep x 100 rows (exec in-mem) 19 22 4 5.3 190.1 0.7X
+1024 x 11 deep x 100 rows (read parquet) 35 37 4 2.9 346.4 0.4X
+1024 x 11 deep x 100 rows (write parquet) 91 95 5 1.1 909.0 0.2X
================================================================================================
wide array field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
wide array field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 wide x 100000 rows (read in-mem) 15 17 3 6.7 150.1 1.0X
-1 wide x 100000 rows (exec in-mem) 17 19 3 6.0 167.9 0.9X
-1 wide x 100000 rows (read parquet) 17 21 3 5.8 173.9 0.9X
-1 wide x 100000 rows (write parquet) 90 97 6 1.1 902.5 0.2X
-100 wide x 1000 rows (read in-mem) 11 13 3 9.0 111.4 1.3X
-100 wide x 1000 rows (exec in-mem) 12 14 3 8.0 124.8 1.2X
-100 wide x 1000 rows (read parquet) 17 18 3 6.0 167.5 0.9X
-100 wide x 1000 rows (write parquet) 85 91 6 1.2 852.9 0.2X
-2500 wide x 40 rows (read in-mem) 11 13 3 9.0 111.4 1.3X
-2500 wide x 40 rows (exec in-mem) 13 15 3 8.0 125.7 1.2X
-2500 wide x 40 rows (read parquet) 18 19 3 5.6 178.1 0.8X
-2500 wide x 40 rows (write parquet) 85 89 4 1.2 848.2 0.2X
+1 wide x 100000 rows (read in-mem) 15 18 3 6.5 154.1 1.0X
+1 wide x 100000 rows (exec in-mem) 18 21 4 5.4 185.0 0.8X
+1 wide x 100000 rows (read parquet) 18 20 3 5.7 175.5 0.9X
+1 wide x 100000 rows (write parquet) 87 92 5 1.2 866.2 0.2X
+100 wide x 1000 rows (read in-mem) 12 13 3 8.6 116.8 1.3X
+100 wide x 1000 rows (exec in-mem) 13 15 3 7.5 133.2 1.2X
+100 wide x 1000 rows (read parquet) 17 20 3 5.9 169.6 0.9X
+100 wide x 1000 rows (write parquet) 85 88 4 1.2 851.1 0.2X
+2500 wide x 40 rows (read in-mem) 12 14 3 8.5 117.8 1.3X
+2500 wide x 40 rows (exec in-mem) 13 15 3 7.5 133.7 1.2X
+2500 wide x 40 rows (read parquet) 17 20 3 5.7 174.8 0.9X
+2500 wide x 40 rows (write parquet) 84 88 6 1.2 835.1 0.2X
================================================================================================
wide map field read and write
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
wide map field r/w: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-1 wide x 100000 rows (read in-mem) 13 14 2 7.8 127.5 1.0X
-1 wide x 100000 rows (exec in-mem) 16 17 2 6.3 159.9 0.8X
-1 wide x 100000 rows (read parquet) 21 23 3 4.8 206.7 0.6X
-1 wide x 100000 rows (write parquet) 87 92 5 1.2 865.5 0.1X
-100 wide x 1000 rows (read in-mem) 8 9 2 12.8 78.1 1.6X
-100 wide x 1000 rows (exec in-mem) 10 11 2 10.2 97.9 1.3X
-100 wide x 1000 rows (read parquet) 18 20 3 5.5 181.5 0.7X
-100 wide x 1000 rows (write parquet) 81 85 4 1.2 808.5 0.2X
-2500 wide x 40 rows (read in-mem) 10 10 1 10.2 97.6 1.3X
-2500 wide x 40 rows (exec in-mem) 11 12 2 8.7 114.5 1.1X
-2500 wide x 40 rows (read parquet) 19 20 3 5.4 185.3 0.7X
-2500 wide x 40 rows (write parquet) 84 89 6 1.2 837.2 0.2X
+1 wide x 100000 rows (read in-mem) 14 16 2 7.1 140.8 1.0X
+1 wide x 100000 rows (exec in-mem) 18 20 2 5.5 180.9 0.8X
+1 wide x 100000 rows (read parquet) 21 23 4 4.8 208.7 0.7X
+1 wide x 100000 rows (write parquet) 85 89 3 1.2 851.5 0.2X
+100 wide x 1000 rows (read in-mem) 8 10 2 13.3 75.3 1.9X
+100 wide x 1000 rows (exec in-mem) 9 11 2 10.7 93.0 1.5X
+100 wide x 1000 rows (read parquet) 18 21 3 5.5 182.0 0.8X
+100 wide x 1000 rows (write parquet) 79 84 4 1.3 793.4 0.2X
+2500 wide x 40 rows (read in-mem) 10 11 2 10.3 97.4 1.4X
+2500 wide x 40 rows (exec in-mem) 11 13 2 8.7 114.6 1.2X
+2500 wide x 40 rows (read parquet) 19 21 3 5.3 188.5 0.7X
+2500 wide x 40 rows (write parquet) 80 86 6 1.2 804.0 0.2X
diff --git a/sql/core/benchmarks/WideTableBenchmark-jdk21-results.txt b/sql/core/benchmarks/WideTableBenchmark-jdk21-results.txt
index 9cf6f38fccc00..52708bcd12a70 100644
--- a/sql/core/benchmarks/WideTableBenchmark-jdk21-results.txt
+++ b/sql/core/benchmarks/WideTableBenchmark-jdk21-results.txt
@@ -2,16 +2,16 @@
projection on wide table
================================================================================================
-OpenJDK 64-Bit Server VM 21.0.6+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 21.0.8+9-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
projection on wide table: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-split threshold 10 2647 2714 60 0.4 2524.1 1.0X
-split threshold 100 2171 2198 47 0.5 2070.3 1.2X
-split threshold 1024 1654 1673 12 0.6 1577.3 1.6X
-split threshold 2048 1614 1633 13 0.6 1539.5 1.6X
-split threshold 4096 1737 1747 9 0.6 1656.7 1.5X
-split threshold 8192 2309 2355 59 0.5 2202.2 1.1X
-split threshold 65536 21274 21439 163 0.0 20288.2 0.1X
+split threshold 10 2651 2709 47 0.4 2527.9 1.0X
+split threshold 100 2175 2187 19 0.5 2074.3 1.2X
+split threshold 1024 1660 1680 13 0.6 1583.5 1.6X
+split threshold 2048 1613 1628 18 0.7 1538.2 1.6X
+split threshold 4096 1713 1745 21 0.6 1634.0 1.5X
+split threshold 8192 2277 2288 13 0.5 2171.1 1.2X
+split threshold 65536 21265 21793 328 0.0 20279.6 0.1X
diff --git a/sql/core/benchmarks/WideTableBenchmark-results.txt b/sql/core/benchmarks/WideTableBenchmark-results.txt
index 89b0c2490a0b5..62845b83a624d 100644
--- a/sql/core/benchmarks/WideTableBenchmark-results.txt
+++ b/sql/core/benchmarks/WideTableBenchmark-results.txt
@@ -2,16 +2,16 @@
projection on wide table
================================================================================================
-OpenJDK 64-Bit Server VM 17.0.14+7-LTS on Linux 6.8.0-1020-azure
+OpenJDK 64-Bit Server VM 17.0.16+8-LTS on Linux 6.11.0-1018-azure
AMD EPYC 7763 64-Core Processor
projection on wide table: Best Time(ms) Avg Time(ms) Stdev(ms) Rate(M/s) Per Row(ns) Relative
------------------------------------------------------------------------------------------------------------------------
-split threshold 10 2555 2620 67 0.4 2437.1 1.0X
-split threshold 100 2044 2069 22 0.5 1949.7 1.2X
-split threshold 1024 1653 1669 18 0.6 1576.0 1.5X
-split threshold 2048 1617 1649 24 0.6 1541.7 1.6X
-split threshold 4096 1687 1691 6 0.6 1608.7 1.5X
-split threshold 8192 2129 2146 24 0.5 2030.3 1.2X
-split threshold 65536 21564 21770 151 0.0 20565.0 0.1X
+split threshold 10 2546 2630 65 0.4 2428.4 1.0X
+split threshold 100 2080 2092 8 0.5 1984.0 1.2X
+split threshold 1024 1660 1685 19 0.6 1583.6 1.5X
+split threshold 2048 1632 1636 5 0.6 1556.0 1.6X
+split threshold 4096 1678 1696 15 0.6 1600.6 1.5X
+split threshold 8192 2133 2141 9 0.5 2034.0 1.2X
+split threshold 65536 21981 22102 128 0.0 20962.3 0.1X
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeExternalRowSorter.java b/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeExternalRowSorter.java
index 90b55a8586de7..66637ac2bbd9f 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeExternalRowSorter.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeExternalRowSorter.java
@@ -120,6 +120,8 @@ private UnsafeExternalRowSorter(
pageSizeBytes,
(int) SparkEnv.get().conf().get(
package$.MODULE$.SHUFFLE_SPILL_NUM_ELEMENTS_FORCE_SPILL_THRESHOLD()),
+ (long) SparkEnv.get().conf().get(
+ package$.MODULE$.SHUFFLE_SPILL_MAX_SIZE_FORCE_SPILL_THRESHOLD()),
canUseRadixSort
);
}
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeFixedWidthAggregationMap.java b/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeFixedWidthAggregationMap.java
index 8587d9290078b..af8d5a4610f64 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeFixedWidthAggregationMap.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeFixedWidthAggregationMap.java
@@ -242,6 +242,8 @@ public UnsafeKVExternalSorter destructAndCreateExternalSorter() throws IOExcepti
map.getPageSizeBytes(),
(int) SparkEnv.get().conf().get(
package$.MODULE$.SHUFFLE_SPILL_NUM_ELEMENTS_FORCE_SPILL_THRESHOLD()),
+ (long) SparkEnv.get().conf().get(
+ package$.MODULE$.SHUFFLE_SPILL_MAX_SIZE_FORCE_SPILL_THRESHOLD()),
map);
}
}
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeKVExternalSorter.java b/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeKVExternalSorter.java
index 6f2d12e6b790a..6affcb61b8d69 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeKVExternalSorter.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/UnsafeKVExternalSorter.java
@@ -60,9 +60,10 @@ public UnsafeKVExternalSorter(
BlockManager blockManager,
SerializerManager serializerManager,
long pageSizeBytes,
- int numElementsForSpillThreshold) throws IOException {
+ int numElementsForSpillThreshold,
+ long maxRecordsSizeForSpillThreshold) throws IOException {
this(keySchema, valueSchema, blockManager, serializerManager, pageSizeBytes,
- numElementsForSpillThreshold, null);
+ numElementsForSpillThreshold, maxRecordsSizeForSpillThreshold, null);
}
public UnsafeKVExternalSorter(
@@ -72,6 +73,7 @@ public UnsafeKVExternalSorter(
SerializerManager serializerManager,
long pageSizeBytes,
int numElementsForSpillThreshold,
+ long maxRecordsSizeForSpillThreshold,
@Nullable BytesToBytesMap map) throws IOException {
this.keySchema = keySchema;
this.valueSchema = valueSchema;
@@ -98,6 +100,7 @@ public UnsafeKVExternalSorter(
(int) (long) SparkEnv.get().conf().get(package$.MODULE$.SHUFFLE_SORT_INIT_BUFFER_SIZE()),
pageSizeBytes,
numElementsForSpillThreshold,
+ maxRecordsSizeForSpillThreshold,
canUseRadixSort);
} else {
// During spilling, the pointer array in `BytesToBytesMap` will not be used, so we can borrow
@@ -165,6 +168,7 @@ public UnsafeKVExternalSorter(
(int) (long) SparkEnv.get().conf().get(package$.MODULE$.SHUFFLE_SORT_INIT_BUFFER_SIZE()),
pageSizeBytes,
numElementsForSpillThreshold,
+ maxRecordsSizeForSpillThreshold,
inMemSorter,
map.getTotalMemoryConsumption());
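
The three call sites above (UnsafeExternalRowSorter, UnsafeFixedWidthAggregationMap, and UnsafeKVExternalSorter) all thread a new size-based force-spill threshold, read from SHUFFLE_SPILL_MAX_SIZE_FORCE_SPILL_THRESHOLD, alongside the existing element-count threshold. A minimal sketch of the extended constructor call, assuming keySchema, valueSchema, blockManager, serializerManager and pageSizeBytes are already in scope as they are in the callers above:

// Sketch only, mirroring the call sites in this patch; not a complete program.
int numElementsForSpillThreshold = (int) SparkEnv.get().conf().get(
    package$.MODULE$.SHUFFLE_SPILL_NUM_ELEMENTS_FORCE_SPILL_THRESHOLD());
long maxRecordsSizeForSpillThreshold = (long) SparkEnv.get().conf().get(
    package$.MODULE$.SHUFFLE_SPILL_MAX_SIZE_FORCE_SPILL_THRESHOLD());
// The new long argument sits between the element-count threshold and the optional map.
UnsafeKVExternalSorter sorter = new UnsafeKVExternalSorter(
    keySchema, valueSchema, blockManager, serializerManager, pageSizeBytes,
    numElementsForSpillThreshold, maxRecordsSizeForSpillThreshold);
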
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/HadoopLineRecordReader.java b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/HadoopLineRecordReader.java
new file mode 100644
index 0000000000000..9a015cc740e42
--- /dev/null
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/HadoopLineRecordReader.java
@@ -0,0 +1,298 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution.datasources;
+
+import java.io.IOException;
+import java.io.InputStream;
+
+import scala.Option;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataInputStream;
+import org.apache.hadoop.fs.FutureDataInputStreamBuilder;
+import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.fs.Seekable;
+import org.apache.hadoop.io.LongWritable;
+import org.apache.hadoop.io.Text;
+import org.apache.hadoop.io.compress.CodecPool;
+import org.apache.hadoop.io.compress.CompressionCodec;
+import org.apache.hadoop.io.compress.SplitCompressionInputStream;
+import org.apache.hadoop.io.compress.SplittableCompressionCodec;
+import org.apache.hadoop.io.compress.Decompressor;
+import org.apache.hadoop.mapreduce.InputSplit;
+import org.apache.hadoop.mapreduce.MRJobConfig;
+import org.apache.hadoop.mapreduce.RecordReader;
+import org.apache.hadoop.mapreduce.TaskAttemptContext;
+import org.apache.hadoop.mapreduce.lib.input.FileSplit;
+import org.apache.hadoop.mapreduce.lib.input.SplitLineReader;
+import org.apache.hadoop.mapreduce.lib.input.CompressedSplitLineReader;
+import org.apache.hadoop.mapreduce.lib.input.UncompressedSplitLineReader;
+import org.apache.hadoop.util.functional.FutureIO;
+import org.apache.spark.internal.SparkLogger;
+import org.apache.spark.internal.SparkLoggerFactory;
+import org.apache.spark.io.HadoopCodecStreams;
+
+import static org.apache.hadoop.fs.Options.OpenFileOptions.FS_OPTION_OPENFILE_SPLIT_END;
+import static org.apache.hadoop.fs.Options.OpenFileOptions.FS_OPTION_OPENFILE_SPLIT_START;
+
+/**
+ * Inlined from Hadoop's LineRecordReader to add support for passing a compression option
+ * and also add support for other codecs like ZSTD.
+ * Specifically, it calls HadoopCodecStreams.getDecompressionCodec to get the codec
+ * and calls HadoopCodecStreams.createZstdInputStream when the codec fails to create the
+ * InputStream.
+ */
+
+/**
+ * Treats keys as offset in file and value as line.
+ */
+public class HadoopLineRecordReader extends RecordReader<LongWritable, Text> {
+ public static final String MAX_LINE_LENGTH =
+ "mapreduce.input.linerecordreader.line.maxlength";
+ private static final SparkLogger LOG =
+ SparkLoggerFactory.getLogger(HadoopLineRecordReader.class);
+
+ private long start;
+ private long pos;
+ private long end;
+ private SplitLineReader in;
+ private FSDataInputStream fileIn;
+ private Seekable filePosition;
+ private int maxLineLength;
+ private LongWritable key;
+ private Text value;
+ private boolean isCompressedInput;
+ private Decompressor decompressor;
+ private byte[] recordDelimiterBytes;
+
+ public HadoopLineRecordReader() {
+ }
+
+ public HadoopLineRecordReader(byte[] recordDelimiter) {
+ this.recordDelimiterBytes = recordDelimiter;
+ }
+
+ public void initialize(InputSplit genericSplit,
+ TaskAttemptContext context) throws IOException {
+ FileSplit split = (FileSplit) genericSplit;
+ Configuration job = context.getConfiguration();
+ this.maxLineLength = job.getInt(MAX_LINE_LENGTH, Integer.MAX_VALUE);
+ start = split.getStart();
+ end = start + split.getLength();
+ final Path file = split.getPath();
+
+ // open the file and seek to the start of the split
+ final FutureDataInputStreamBuilder builder =
+ file.getFileSystem(job).openFile(file);
+ // the start and end of the split may be used to build
+ // an input strategy.
+ builder.optLong(FS_OPTION_OPENFILE_SPLIT_START, start);
+ builder.optLong(FS_OPTION_OPENFILE_SPLIT_END, end);
+ FutureIO.propagateOptions(builder, job,
+ MRJobConfig.INPUT_FILE_OPTION_PREFIX,
+ MRJobConfig.INPUT_FILE_MANDATORY_PREFIX);
+ fileIn = FutureIO.awaitFuture(builder.build());
+
+ try {
+ Option<CompressionCodec> codecOpt = HadoopCodecStreams.getDecompressionCodec(job, file);
+ if (codecOpt.isDefined()) {
+ CompressionCodec codec = codecOpt.get();
+ isCompressedInput = true;
+ try {
+ decompressor = CodecPool.getDecompressor(codec);
+ if (codec instanceof SplittableCompressionCodec) {
+ final SplitCompressionInputStream cIn =
+ ((SplittableCompressionCodec) codec).createInputStream(
+ fileIn, decompressor, start, end,
+ SplittableCompressionCodec.READ_MODE.BYBLOCK);
+ in = new CompressedSplitLineReader(cIn, job,
+ this.recordDelimiterBytes);
+ start = cIn.getAdjustedStart();
+ end = cIn.getAdjustedEnd();
+ filePosition = cIn;
+ } else {
+ if (start != 0) {
+ // So we have a split that is only part of a file stored using
+ // a Compression codec that cannot be split.
+ throw new IOException("Cannot seek in " +
+ codec.getClass().getSimpleName() + " compressed stream");
+ }
+
+ in = new SplitLineReader(codec.createInputStream(fileIn,
+ decompressor), job, this.recordDelimiterBytes);
+ filePosition = fileIn;
+ }
+ } catch (RuntimeException e) {
+ // Try Spark's ZSTD decompression support. This is not available in Hadoop's
+ // version of LineRecordReader.
+ Option<InputStream> decompressedStreamOpt =
+ HadoopCodecStreams.createZstdInputStream(file, fileIn);
+ if (decompressedStreamOpt.isEmpty()) {
+ // File is either not ZSTD compressed or ZSTD codec is not available.
+ throw e;
+ }
+ InputStream decompressedStream = decompressedStreamOpt.get();
+ if (start != 0) {
+ decompressedStream.close();
+ throw new IOException("Cannot seek in "+ file.getName() +
+ " compressed stream");
+ }
+
+ isCompressedInput = true;
+ in = new SplitLineReader(decompressedStream, job, this.recordDelimiterBytes);
+ filePosition = fileIn;
+ }
+ } else {
+ fileIn.seek(start);
+ in = new UncompressedSplitLineReader(
+ fileIn, job, this.recordDelimiterBytes, split.getLength());
+ filePosition = fileIn;
+ }
+ // If this is not the first split, we always throw away the first record
+ // because we always (except for the last split) read one extra line in
+ // the next() method.
+ if (start != 0) {
+ start += in.readLine(new Text(), 0, maxBytesToConsume(start));
+ }
+ this.pos = start;
+ } catch (Exception e) {
+ fileIn.close();
+ throw e;
+ }
+ }
+
+
+ private int maxBytesToConsume(long pos) {
+ return isCompressedInput
+ ? Integer.MAX_VALUE
+ : (int) Math.max(Math.min(Integer.MAX_VALUE, end - pos), maxLineLength);
+ }
+
+ private long getFilePosition() throws IOException {
+ long retVal;
+ if (isCompressedInput && null != filePosition) {
+ retVal = filePosition.getPos();
+ } else {
+ retVal = pos;
+ }
+ return retVal;
+ }
+
+ private int skipUtfByteOrderMark() throws IOException {
+ // Strip the BOM (Byte Order Mark).
+ // Text only supports UTF-8, so we only need to check for the UTF-8 BOM
+ // (0xEF,0xBB,0xBF) at the start of the text stream.
+ int newMaxLineLength = (int) Math.min(3L + (long) maxLineLength,
+ Integer.MAX_VALUE);
+ int newSize = in.readLine(value, newMaxLineLength, maxBytesToConsume(pos));
+ // Even though we read 3 extra bytes for the first line,
+ // we won't alter existing behavior (no backwards-incompatibility issue).
+ // Because the newSize is less than maxLineLength and
+ // the number of bytes copied to Text is always no more than newSize.
+ // If the return size from readLine is not less than maxLineLength,
+ // we will discard the current line and read the next line.
+ pos += newSize;
+ int textLength = value.getLength();
+ byte[] textBytes = value.getBytes();
+ if ((textLength >= 3) && (textBytes[0] == (byte)0xEF) &&
+ (textBytes[1] == (byte)0xBB) && (textBytes[2] == (byte)0xBF)) {
+ // find UTF-8 BOM, strip it.
+ LOG.info("Found UTF-8 BOM and skipped it");
+ textLength -= 3;
+ newSize -= 3;
+ if (textLength > 0) {
+ // It may work to use the same buffer and not do the copyBytes
+ textBytes = value.copyBytes();
+ value.set(textBytes, 3, textLength);
+ } else {
+ value.clear();
+ }
+ }
+ return newSize;
+ }
+
+ public boolean nextKeyValue() throws IOException {
+ if (key == null) {
+ key = new LongWritable();
+ }
+ key.set(pos);
+ if (value == null) {
+ value = new Text();
+ }
+ int newSize = 0;
+ // We always read one extra line, which lies outside the upper
+ // split limit i.e. (end - 1)
+ while (getFilePosition() <= end || in.needAdditionalRecordAfterSplit()) {
+ if (pos == 0) {
+ newSize = skipUtfByteOrderMark();
+ } else {
+ newSize = in.readLine(value, maxLineLength, maxBytesToConsume(pos));
+ pos += newSize;
+ }
+
+ if ((newSize == 0) || (newSize < maxLineLength)) {
+ break;
+ }
+
+ // line too long. try again
+ LOG.info("Skipped line of size " + newSize + " at pos " +
+ (pos - newSize));
+ }
+ if (newSize == 0) {
+ key = null;
+ value = null;
+ return false;
+ } else {
+ return true;
+ }
+ }
+
+ @Override
+ public LongWritable getCurrentKey() {
+ return key;
+ }
+
+ @Override
+ public Text getCurrentValue() {
+ return value;
+ }
+
+ /**
+ * Get the progress within the split
+ */
+ public float getProgress() throws IOException {
+ if (start == end) {
+ return 0.0f;
+ } else {
+ return Math.min(1.0f, (getFilePosition() - start) / (float)(end - start));
+ }
+ }
+
+ public synchronized void close() throws IOException {
+ try {
+ if (in != null) {
+ in.close();
+ }
+ } finally {
+ if (decompressor != null) {
+ CodecPool.returnDecompressor(decompressor);
+ decompressor = null;
+ }
+ }
+ }
+}
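
The inlined reader keeps Hadoop's RecordReader contract (initialize, nextKeyValue, getCurrentKey, getCurrentValue, getProgress, close), so callers drive it the same way as the mapreduce LineRecordReader it was copied from. A minimal usage sketch, assuming the FileSplit and TaskAttemptContext come from the surrounding file-source code and processLine is a hypothetical per-line handler:

// Sketch only; `split`, `context` and `processLine` are assumed to exist in the caller.
HadoopLineRecordReader reader = new HadoopLineRecordReader();
try {
  reader.initialize(split, context);              // picks a (de)compression codec and seeks to the split start
  while (reader.nextKeyValue()) {                 // reads one extra line past the split end, like Hadoop's reader
    long offset = reader.getCurrentKey().get();   // byte offset of the line within the file
    processLine(offset, reader.getCurrentValue());
  }
} finally {
  reader.close();                                 // also returns the decompressor to the CodecPool
}
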
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetColumnVector.java b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetColumnVector.java
index 7fb8be7caf286..3331c8dfd8f5c 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetColumnVector.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetColumnVector.java
@@ -21,9 +21,8 @@
import java.util.List;
import java.util.Set;
-import com.google.common.base.Preconditions;
-
import org.apache.spark.memory.MemoryMode;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.sql.execution.vectorized.OffHeapColumnVector;
import org.apache.spark.sql.execution.vectorized.OnHeapColumnVector;
import org.apache.spark.sql.execution.vectorized.WritableColumnVector;
@@ -131,7 +130,8 @@ final class ParquetColumnVector {
definitionLevels = allocateLevelsVector(capacity, memoryMode);
}
} else {
- Preconditions.checkArgument(column.children().size() == vector.getNumChildren());
+ JavaUtils.checkArgument(column.children().size() == vector.getNumChildren(),
+ "The number of column children is different from the number of vector children");
boolean allChildrenAreMissing = true;
for (int i = 0; i < column.children().size(); i++) {
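
This is part of a broader swap in the patch: the vectorized Parquet reader classes here and below replace Guava's and Parquet's Preconditions with Spark's own JavaUtils.checkArgument, keeping the same two-argument (condition, message) precondition style while dropping the third-party helper. The call shape, taken from the hunks in this patch:

// Same call shape as the Preconditions calls it replaces.
JavaUtils.checkArgument(column.children().size() == vector.getNumChildren(),
    "The number of column children is different from the number of vector children");
JavaUtils.checkArgument(bitWidth >= 0 && bitWidth <= 32, "bitWidth must be >= 0 and <= 32");
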
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetVectorUpdaterFactory.java b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetVectorUpdaterFactory.java
index 889f11e119730..eb6c84b8113b8 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetVectorUpdaterFactory.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/ParquetVectorUpdaterFactory.java
@@ -24,6 +24,7 @@
import org.apache.parquet.schema.LogicalTypeAnnotation.IntLogicalTypeAnnotation;
import org.apache.parquet.schema.LogicalTypeAnnotation.DateLogicalTypeAnnotation;
import org.apache.parquet.schema.LogicalTypeAnnotation.DecimalLogicalTypeAnnotation;
+import org.apache.parquet.schema.LogicalTypeAnnotation.TimeLogicalTypeAnnotation;
import org.apache.parquet.schema.LogicalTypeAnnotation.TimestampLogicalTypeAnnotation;
import org.apache.parquet.schema.PrimitiveType;
@@ -159,7 +160,7 @@ public ParquetVectorUpdater getUpdater(ColumnDescriptor descriptor, DataType spa
} else if (canReadAsDecimal(descriptor, sparkType)) {
return new LongToDecimalUpdater(descriptor, (DecimalType) sparkType);
} else if (sparkType instanceof TimeType) {
- return new LongUpdater();
+ return new LongAsNanosUpdater();
}
}
case FLOAT -> {
@@ -233,6 +234,11 @@ boolean isTimestampTypeMatched(LogicalTypeAnnotation.TimeUnit unit) {
annotation.getUnit() == unit;
}
+ boolean isTimeTypeMatched(LogicalTypeAnnotation.TimeUnit unit) {
+ return logicalTypeAnnotation instanceof TimeLogicalTypeAnnotation annotation &&
+ annotation.getUnit() == unit;
+ }
+
boolean isUnsignedIntTypeMatched(int bitWidth) {
return logicalTypeAnnotation instanceof IntLogicalTypeAnnotation annotation &&
!annotation.isSigned() && annotation.getBitWidth() == bitWidth;
@@ -825,6 +831,42 @@ public void decodeSingleDictionaryId(
}
}
+ private static class LongAsNanosUpdater implements ParquetVectorUpdater {
+ @Override
+ public void readValues(
+ int total,
+ int offset,
+ WritableColumnVector values,
+ VectorizedValuesReader valuesReader) {
+ for (int i = 0; i < total; ++i) {
+ readValue(offset + i, values, valuesReader);
+ }
+ }
+
+ @Override
+ public void skipValues(int total, VectorizedValuesReader valuesReader) {
+ valuesReader.skipLongs(total);
+ }
+
+ @Override
+ public void readValue(
+ int offset,
+ WritableColumnVector values,
+ VectorizedValuesReader valuesReader) {
+ values.putLong(offset, DateTimeUtils.microsToNanos(valuesReader.readLong()));
+ }
+
+ @Override
+ public void decodeSingleDictionaryId(
+ int offset,
+ WritableColumnVector values,
+ WritableColumnVector dictionaryIds,
+ Dictionary dictionary) {
+ long micros = dictionary.decodeToLong(dictionaryIds.getDictId(offset));
+ values.putLong(offset, DateTimeUtils.microsToNanos(micros));
+ }
+ }
+
private static class FloatUpdater implements ParquetVectorUpdater {
@Override
public void readValues(
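
The new LongAsNanosUpdater converts Parquet TIME(MICROS) values into the nanosecond representation used by Spark's TimeType while they are being read, instead of copying the raw longs as the previous LongUpdater did; the VectorizedColumnReader change further below turns off lazy dictionary decoding for this case because the stored micros need the same upcast. An illustration of the per-value conversion, assuming DateTimeUtils.microsToNanos is an overflow-checked multiply by 1,000:

// Illustration only of the micros -> nanos widening the updater applies to each value.
static long microsToNanosSketch(long micros) {
  return Math.multiplyExact(micros, 1_000L);   // assumed equivalent of DateTimeUtils.microsToNanos
}

// 12:30:15.123456 stored as microseconds since midnight:
long micros = 45_015_123_456L;
long nanos = microsToNanosSketch(micros);      // 45_015_123_456_000L
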
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedColumnReader.java b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedColumnReader.java
index 731c78cf94503..6e1660dc8c873 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedColumnReader.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedColumnReader.java
@@ -165,7 +165,8 @@ private boolean isLazyDecodingSupported(
case INT64: {
boolean isDecimal = sparkType instanceof DecimalType;
boolean needsUpcast = (isDecimal && !DecimalType.is64BitDecimalType(sparkType)) ||
- updaterFactory.isTimestampTypeMatched(TimeUnit.MILLIS);
+ updaterFactory.isTimestampTypeMatched(TimeUnit.MILLIS) ||
+ updaterFactory.isTimeTypeMatched(TimeUnit.MICROS);
boolean needsRebase = updaterFactory.isTimestampTypeMatched(TimeUnit.MICROS) &&
!"CORRECTED".equals(datetimeRebaseMode);
isSupported = !needsUpcast && !needsRebase && !needsDecimalScaleRebase(sparkType);
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedDeltaBinaryPackedReader.java b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedDeltaBinaryPackedReader.java
index 071720d4dbfc7..7b56e1ebf2394 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedDeltaBinaryPackedReader.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedDeltaBinaryPackedReader.java
@@ -21,12 +21,13 @@
import java.nio.ByteBuffer;
import java.util.Arrays;
-import org.apache.parquet.Preconditions;
import org.apache.parquet.bytes.ByteBufferInputStream;
import org.apache.parquet.bytes.BytesUtils;
import org.apache.parquet.column.values.bitpacking.BytePackerForLong;
import org.apache.parquet.column.values.bitpacking.Packer;
import org.apache.parquet.io.ParquetDecodingException;
+
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.sql.catalyst.util.RebaseDateTime;
import org.apache.spark.sql.execution.datasources.DataSourceUtils;
import org.apache.spark.sql.execution.vectorized.WritableColumnVector;
@@ -80,14 +81,14 @@ public class VectorizedDeltaBinaryPackedReader extends VectorizedReaderBase {
@Override
public void initFromPage(int valueCount, ByteBufferInputStream in) throws IOException {
- Preconditions.checkArgument(valueCount >= 1,
+ JavaUtils.checkArgument(valueCount >= 1,
"Page must have at least one value, but it has " + valueCount);
this.in = in;
// Read the header
this.blockSizeInValues = BytesUtils.readUnsignedVarInt(in);
this.miniBlockNumInABlock = BytesUtils.readUnsignedVarInt(in);
double miniSize = (double) blockSizeInValues / miniBlockNumInABlock;
- Preconditions.checkArgument(miniSize % 8 == 0,
+ JavaUtils.checkArgument(miniSize % 8 == 0,
"miniBlockSize must be multiple of 8, but it's " + miniSize);
this.miniBlockSizeInValues = (int) miniSize;
// True value count. May be less than valueCount because of nulls
diff --git a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedRleValuesReader.java b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedRleValuesReader.java
index 0d380997fd5b6..60544665409df 100644
--- a/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedRleValuesReader.java
+++ b/sql/core/src/main/java/org/apache/spark/sql/execution/datasources/parquet/VectorizedRleValuesReader.java
@@ -20,7 +20,6 @@
import java.io.IOException;
import java.nio.ByteBuffer;
-import org.apache.parquet.Preconditions;
import org.apache.parquet.bytes.ByteBufferInputStream;
import org.apache.parquet.bytes.BytesUtils;
import org.apache.parquet.column.values.ValuesReader;
@@ -30,6 +29,7 @@
import org.apache.parquet.io.api.Binary;
import org.apache.spark.SparkUnsupportedOperationException;
+import org.apache.spark.network.util.JavaUtils;
import org.apache.spark.sql.execution.vectorized.WritableColumnVector;
/**
@@ -122,7 +122,7 @@ public void initFromPage(int valueCount, ByteBufferInputStream in) throws IOExce
* Initializes the internal state for decoding ints of `bitWidth`.
*/
private void init(int bitWidth) {
- Preconditions.checkArgument(bitWidth >= 0 && bitWidth <= 32, "bitWidth must be >= 0 and <= 32");
+ JavaUtils.checkArgument(bitWidth >= 0 && bitWidth <= 32, "bitWidth must be >= 0 and <= 32");
this.bitWidth = bitWidth;
this.bytesWidth = BytesUtils.paddedByteCountFromBits(bitWidth);
this.packer = Packer.LITTLE_ENDIAN.newBytePacker(bitWidth);
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/api/python/PythonSQLUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/api/python/PythonSQLUtils.scala
index 40779c66600fd..85f59c282ff55 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/api/python/PythonSQLUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/api/python/PythonSQLUtils.scala
@@ -23,10 +23,10 @@ import java.nio.channels.{Channels, SocketChannel}
import net.razorvine.pickle.{Pickler, Unpickler}
import org.apache.spark.api.python.DechunkedInputStream
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.CLASS_LOADER
import org.apache.spark.security.SocketAuthServer
-import org.apache.spark.sql.{internal, Column, DataFrame, Row, SparkSession}
+import org.apache.spark.sql.{internal, Column, DataFrame, Row, SparkSession, TableArg}
import org.apache.spark.sql.catalyst.{CatalystTypeConverters, InternalRow}
import org.apache.spark.sql.catalyst.analysis.{FunctionRegistry, TableFunctionRegistry}
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
@@ -182,6 +182,9 @@ private[sql] object PythonSQLUtils extends Logging {
def namedArgumentExpression(name: String, e: Column): Column =
Column(NamedArgumentExpression(name, expression(e)))
+ def namedArgumentExpression(name: String, e: TableArg): Column =
+ Column(NamedArgumentExpression(name, e.expression))
+
@scala.annotation.varargs
def fn(name: String, arguments: Column*): Column = Column.fn(name, arguments: _*)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/api/r/SQLUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/api/r/SQLUtils.scala
index 1efd8f9e32208..3fc3cf698df9b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/api/r/SQLUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/api/r/SQLUtils.scala
@@ -27,7 +27,7 @@ import org.apache.spark.TaskContext
import org.apache.spark.api.java.{JavaRDD, JavaSparkContext}
import org.apache.spark.api.r.SerDe
import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.CONFIG
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.Row
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/artifact/ArtifactManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/artifact/ArtifactManager.scala
index 35e8e5c6000ae..de91e5e8a44b2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/artifact/ArtifactManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/artifact/ArtifactManager.scala
@@ -25,14 +25,15 @@ import java.nio.file.{CopyOption, Files, Path, Paths, StandardCopyOption}
import java.util.concurrent.CopyOnWriteArrayList
import java.util.concurrent.atomic.AtomicBoolean
+import scala.collection.mutable.ListBuffer
import scala.jdk.CollectionConverters._
import scala.reflect.ClassTag
-import org.apache.commons.io.{FilenameUtils, FileUtils}
+import org.apache.commons.io.FilenameUtils
import org.apache.hadoop.fs.{LocalFileSystem, Path => FSPath}
import org.apache.spark.{JobArtifactSet, JobArtifactState, SparkContext, SparkEnv, SparkException, SparkRuntimeException, SparkUnsupportedOperationException}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.config.{CONNECT_SCALA_UDF_STUB_PREFIXES, EXECUTOR_USER_CLASS_PATH_FIRST}
import org.apache.spark.sql.Artifact
import org.apache.spark.sql.classic.SparkSession
@@ -213,7 +214,7 @@ class ArtifactManager(session: SparkSession) extends AutoCloseable with Logging
// Disallow overwriting with modified version
if (Files.exists(target)) {
// makes the query idempotent
- if (FileUtils.contentEquals(target.toFile, serverLocalStagingPath.toFile)) {
+ if (Utils.contentEquals(target.toFile, serverLocalStagingPath.toFile)) {
return
}
@@ -266,28 +267,39 @@ class ArtifactManager(session: SparkSession) extends AutoCloseable with Logging
* they are from a permanent location.
*/
private[sql] def addLocalArtifacts(artifacts: Seq[Artifact]): Unit = {
+ val failedArtifactExceptions = ListBuffer[SparkRuntimeException]()
+
artifacts.foreach { artifact =>
- artifact.storage match {
- case d: Artifact.LocalFile =>
- addArtifact(
- artifact.path,
- d.path,
- fragment = None,
- deleteStagedFile = false)
- case d: Artifact.InMemory =>
- val tempDir = Utils.createTempDir().toPath
- val tempFile = tempDir.resolve(artifact.path.getFileName)
- val outStream = Files.newOutputStream(tempFile)
- Utils.tryWithSafeFinallyAndFailureCallbacks {
- d.stream.transferTo(outStream)
- addArtifact(artifact.path, tempFile, fragment = None)
- }(finallyBlock = {
- outStream.close()
- })
- case _ =>
- throw SparkException.internalError(s"Unsupported artifact storage: ${artifact.storage}")
+ try {
+ artifact.storage match {
+ case d: Artifact.LocalFile =>
+ addArtifact(
+ artifact.path,
+ d.path,
+ fragment = None,
+ deleteStagedFile = false)
+ case d: Artifact.InMemory =>
+ val tempDir = Utils.createTempDir().toPath
+ val tempFile = tempDir.resolve(artifact.path.getFileName)
+ val outStream = Files.newOutputStream(tempFile)
+ Utils.tryWithSafeFinallyAndFailureCallbacks {
+ d.stream.transferTo(outStream)
+ addArtifact(artifact.path, tempFile, fragment = None)
+ }(finallyBlock = {
+ outStream.close()
+ })
+ case _ =>
+ throw SparkException.internalError(s"Unsupported artifact storage: ${artifact.storage}")
+ }
+ } catch {
+ case e: SparkRuntimeException if e.getCondition == "ARTIFACT_ALREADY_EXISTS" =>
+ failedArtifactExceptions += e
}
}
+
+ if (failedArtifactExceptions.nonEmpty) {
+ throw ArtifactUtils.mergeExceptionsWithSuppressed(failedArtifactExceptions.toSeq)
+ }
}
def classloader: ClassLoader = synchronized {
@@ -340,7 +352,7 @@ class ArtifactManager(session: SparkSession) extends AutoCloseable with Logging
val sparkContext = session.sparkContext
val newArtifactManager = new ArtifactManager(newSession)
if (artifactPath.toFile.exists()) {
- FileUtils.copyDirectory(artifactPath.toFile, newArtifactManager.artifactPath.toFile)
+ Utils.copyDirectory(artifactPath.toFile, newArtifactManager.artifactPath.toFile)
}
val blockManager = sparkContext.env.blockManager
val newBlockIds = cachedBlockIdList.asScala.map { blockId =>
@@ -524,7 +536,7 @@ object ArtifactManager extends Logging {
// Clean up artifacts folder
try {
- FileUtils.deleteDirectory(artifactPath.toFile)
+ Utils.deleteRecursively(artifactPath.toFile)
} catch {
case e: IOException =>
logWarning(log"Failed to delete directory ${MDC(LogKeys.PATH, artifactPath.toFile)}: " +
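Editorial sketch for the addLocalArtifacts change above: instead of failing on the first ARTIFACT_ALREADY_EXISTS error, the loop now collects every such failure and rethrows them as one exception with the rest attached as suppressed. A minimal, self-contained sketch of that collect-then-merge pattern follows; mergeWithSuppressed is a simplified stand-in for ArtifactUtils.mergeExceptionsWithSuppressed, whose exact signature is not shown in this diff.

import scala.collection.mutable.ListBuffer

object SuppressedMergeSketch {
  // Stand-in merge helper: keep the first exception and attach the rest as suppressed.
  def mergeWithSuppressed[E <: Throwable](errors: Seq[E]): E = {
    require(errors.nonEmpty, "at least one exception expected")
    val first = errors.head
    errors.tail.foreach(e => first.addSuppressed(e))
    first
  }

  // Mirror of the addLocalArtifacts shape: keep going on known failures,
  // then report them all at once.
  def addAll(items: Seq[String])(add: String => Unit): Unit = {
    val failures = ListBuffer[RuntimeException]()
    items.foreach { item =>
      try add(item)
      catch { case e: RuntimeException => failures += e }
    }
    if (failures.nonEmpty) throw mergeWithSuppressed(failures.toSeq)
  }
}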
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroDeserializer.scala b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroDeserializer.scala
index 65fafb5a34c6e..f66b5bd988c2b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroDeserializer.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroDeserializer.scala
@@ -58,7 +58,7 @@ private[sql] class AvroDeserializer(
def this(
rootAvroType: Schema,
rootCatalystType: DataType,
- datetimeRebaseMode: LegacyBehaviorPolicy.Value,
+ datetimeRebaseMode: String,
useStableIdForUnionType: Boolean,
stableIdPrefixForUnionType: String,
recursiveFieldMaxDepth: Int) = {
@@ -66,7 +66,7 @@ private[sql] class AvroDeserializer(
rootAvroType,
rootCatalystType,
positionalFieldMatch = false,
- RebaseSpec(datetimeRebaseMode),
+ RebaseSpec(LegacyBehaviorPolicy.withName(datetimeRebaseMode)),
new NoopFilters,
useStableIdForUnionType,
stableIdPrefixForUnionType,
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroFileFormat.scala
index bf35a78488e44..90781d4ad7077 100755
--- a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroFileFormat.scala
@@ -34,13 +34,16 @@ import org.apache.spark.internal.Logging
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.{InternalRow, NoopFilters, OrderedFilters}
import org.apache.spark.sql.execution.datasources.{DataSourceUtils, FileFormat, OutputWriterFactory, PartitionedFile}
-import org.apache.spark.sql.internal.SQLConf
+import org.apache.spark.sql.internal.{SessionStateHelper, SQLConf}
import org.apache.spark.sql.sources.{DataSourceRegister, Filter}
import org.apache.spark.sql.types._
import org.apache.spark.util.SerializableConfiguration
private[sql] class AvroFileFormat extends FileFormat
- with DataSourceRegister with Logging with Serializable {
+ with DataSourceRegister
+ with SessionStateHelper
+ with Logging
+ with Serializable {
AvroFileFormat.registerCustomAvroTypes()
@@ -73,7 +76,7 @@ private[sql] class AvroFileFormat extends FileFormat
job: Job,
options: Map[String, String],
dataSchema: StructType): OutputWriterFactory = {
- AvroUtils.prepareWrite(spark.sessionState.conf, job, options, dataSchema)
+ AvroUtils.prepareWrite(getSqlConf(spark), job, options, dataSchema)
}
override def buildReader(
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroOptions.scala b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroOptions.scala
index ab3607d1bd7a7..da42333fad0fb 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroOptions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroOptions.scala
@@ -29,7 +29,7 @@ import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.{DataSourceOptions, FileSourceOptions}
import org.apache.spark.sql.catalyst.util.{CaseInsensitiveMap, FailFastMode, ParseMode}
import org.apache.spark.sql.errors.QueryCompilationErrors
-import org.apache.spark.sql.internal.{LegacyBehaviorPolicy, SQLConf}
+import org.apache.spark.sql.internal.SQLConf
/**
* Options for Avro Reader and Writer stored in case insensitive manner.
@@ -129,9 +129,9 @@ private[sql] class AvroOptions(
/**
* The rebasing mode for the DATE and TIMESTAMP_MICROS, TIMESTAMP_MILLIS values in reads.
*/
- val datetimeRebaseModeInRead: LegacyBehaviorPolicy.Value = parameters
- .get(DATETIME_REBASE_MODE).map(LegacyBehaviorPolicy.withName)
- .getOrElse(SQLConf.get.getConf(SQLConf.AVRO_REBASE_MODE_IN_READ))
+ val datetimeRebaseModeInRead: String = parameters
+ .get(DATETIME_REBASE_MODE)
+ .getOrElse(SQLConf.get.getConf(SQLConf.AVRO_REBASE_MODE_IN_READ).toString)
val useStableIdForUnionType: Boolean =
parameters.get(STABLE_ID_FOR_UNION_TYPE).map(_.toBoolean).getOrElse(false)
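Editorial sketch for the AvroDeserializer/AvroOptions pair above: the rebase mode now travels between the two as a plain String and is parsed back with LegacyBehaviorPolicy.withName only where the enumeration is actually needed. A minimal sketch of that round trip follows, using a stand-in enumeration; the concrete policy names are assumptions for illustration, not taken from this diff.

object RebaseModeSketch {
  // Stand-in enumeration with the same shape as LegacyBehaviorPolicy.
  object Policy extends Enumeration {
    val EXCEPTION, CORRECTED, LEGACY = Value
  }

  // Options layer: keep the raw string, falling back to a configured default.
  def modeFromOptions(options: Map[String, String], default: Policy.Value): String =
    options.getOrElse("datetimeRebaseMode", default.toString)

  // Deserializer layer: parse the string back into the enumeration when needed.
  def parseMode(mode: String): Policy.Value = Policy.withName(mode)

  def main(args: Array[String]): Unit = {
    val mode = modeFromOptions(Map.empty, Policy.CORRECTED)
    assert(parseMode(mode) == Policy.CORRECTED)
  }
}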
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroUtils.scala
index b388c98ffcb1d..c338bd428bbed 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/avro/AvroUtils.scala
@@ -31,7 +31,7 @@ import org.apache.hadoop.fs.FileStatus
import org.apache.hadoop.mapreduce.Job
import org.apache.spark.{SparkException, SparkIllegalArgumentException}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CODEC_LEVEL, CODEC_NAME, CONFIG, PATH}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.avro.AvroCompressionCodec._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/avro/SchemaConverters.scala b/sql/core/src/main/scala/org/apache/spark/sql/avro/SchemaConverters.scala
index c936099ef3764..b425f63d6a7ed 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/avro/SchemaConverters.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/avro/SchemaConverters.scala
@@ -28,7 +28,7 @@ import org.apache.avro.Schema.Type._
import org.apache.avro.SchemaBuilder.FieldAssembler
import org.apache.spark.annotation.DeveloperApi
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{FIELD_NAME, FIELD_TYPE, RECURSIVE_DEPTH}
import org.apache.spark.sql.avro.AvroOptions.RECURSIVE_FIELD_MAX_DEPTH_LIMIT
import org.apache.spark.sql.catalyst.parser.CatalystSqlParser
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataSource.scala
index 07208ca7760db..a7b3385a27820 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveDataSource.scala
@@ -34,7 +34,7 @@ import org.apache.spark.sql.execution.command.DDLUtils
import org.apache.spark.sql.execution.datasources.{DataSource, LogicalRelation}
import org.apache.spark.sql.execution.datasources.v2.{DataSourceV2Utils, FileDataSourceV2}
import org.apache.spark.sql.execution.datasources.v2.python.PythonDataSourceV2
-import org.apache.spark.sql.execution.streaming.StreamingRelation
+import org.apache.spark.sql.execution.streaming.runtime.StreamingRelation
import org.apache.spark.sql.sources.StreamSourceProvider
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.util.CaseInsensitiveStringMap
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSessionCatalog.scala b/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSessionCatalog.scala
index d7d8fc07b872f..b664f52c8c1c5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSessionCatalog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/catalyst/analysis/ResolveSessionCatalog.scala
@@ -17,11 +17,8 @@
package org.apache.spark.sql.catalyst.analysis
-import org.apache.commons.lang3.StringUtils
-
import org.apache.spark.SparkException
import org.apache.spark.internal.LogKeys.CONFIG
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.SaveMode
import org.apache.spark.sql.catalyst.{FunctionIdentifier, TableIdentifier}
import org.apache.spark.sql.catalyst.catalog.{CatalogStorageFormat, CatalogTable, CatalogTableType, CatalogUtils, ClusterBySpec}
@@ -40,6 +37,7 @@ import org.apache.spark.sql.internal.{HiveSerDe, SQLConf}
import org.apache.spark.sql.internal.connector.V1Function
import org.apache.spark.sql.types.{MetadataBuilder, StringType, StructField, StructType}
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.SparkStringUtils
/**
* Converts resolved v2 commands to v1 if the catalog is the session catalog. Since the v2 commands
@@ -149,7 +147,7 @@ class ResolveSessionCatalog(val catalogManager: CatalogManager)
AlterDatabasePropertiesCommand(db, properties)
case SetNamespaceLocation(ResolvedV1Database(db), location) if conf.useV1Command =>
- if (StringUtils.isEmpty(location)) {
+ if (SparkStringUtils.isEmpty(location)) {
throw QueryExecutionErrors.invalidEmptyLocationError(location)
}
AlterDatabaseSetLocationCommand(db, location)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/Catalog.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/Catalog.scala
index 1e028d2046eb5..45f494f65c300 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/Catalog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/Catalog.scala
@@ -36,6 +36,7 @@ import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
import org.apache.spark.sql.connector.catalog.{CatalogManager, SupportsNamespaces, TableCatalog}
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.{CatalogHelper, MultipartIdentifierHelper, NamespaceHelper, TransformHelper}
+import org.apache.spark.sql.connector.catalog.CatalogV2Util.v2ColumnsToStructType
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.command.{ShowNamespacesCommand, ShowTablesCommand}
import org.apache.spark.sql.execution.datasources.{DataSource, LogicalRelation}
@@ -408,7 +409,8 @@ class Catalog(sparkSession: SparkSession) extends catalog.Catalog {
val clusteringColumnNames = clusterBySpecOpt.map { clusterBySpec =>
clusterBySpec.columnNames.map(_.toString)
}.getOrElse(Nil).toSet
- schemaToColumns(table.schema(), partitionColumnNames.contains, bucketColumnNames.contains,
+ val schema = v2ColumnsToStructType(table.columns())
+ schemaToColumns(schema, partitionColumnNames.contains, bucketColumnNames.contains,
clusteringColumnNames.contains)
case ResolvedPersistentView(_, _, metadata) =>
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriter.scala
index 501b4985128dd..2d3e4b84d9ae5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriter.scala
@@ -25,7 +25,7 @@ import org.apache.spark.annotation.Stable
import org.apache.spark.sql
import org.apache.spark.sql.SaveMode
import org.apache.spark.sql.catalyst.TableIdentifier
-import org.apache.spark.sql.catalyst.analysis.{EliminateSubqueryAliases, NoSuchTableException, UnresolvedIdentifier, UnresolvedRelation}
+import org.apache.spark.sql.catalyst.analysis.{NoSuchTableException, UnresolvedIdentifier, UnresolvedRelation}
import org.apache.spark.sql.catalyst.catalog._
import org.apache.spark.sql.catalyst.expressions.Literal
import org.apache.spark.sql.catalyst.plans.logical._
@@ -36,8 +36,8 @@ import org.apache.spark.sql.connector.catalog.TableWritePrivilege._
import org.apache.spark.sql.connector.expressions.{ClusterByTransform, FieldReference, IdentityTransform, Transform}
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.QueryExecution
-import org.apache.spark.sql.execution.command.DDLUtils
-import org.apache.spark.sql.execution.datasources.{CreateTable, DataSource, DataSourceUtils, LogicalRelation}
+import org.apache.spark.sql.execution.command.{DDLUtils, SaveAsV1TableCommand}
+import org.apache.spark.sql.execution.datasources.{DataSource, DataSourceUtils}
import org.apache.spark.sql.execution.datasources.v2._
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.SQLConf.PartitionOverwriteMode
@@ -111,11 +111,9 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
* @since 1.4.0
*/
def save(path: String): Unit = {
- if (!df.sparkSession.sessionState.conf.legacyPathOptionBehavior &&
- extraOptions.contains("path")) {
- throw QueryCompilationErrors.pathOptionNotSetCorrectlyWhenWritingError()
+ runCommand(df.sparkSession) {
+ saveCommand(Some(path))
}
- saveInternal(Some(path))
}
/**
@@ -123,9 +121,17 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
*
* @since 1.4.0
*/
- def save(): Unit = saveInternal(None)
+ def save(): Unit = {
+ runCommand(df.sparkSession) {
+ saveCommand(None)
+ }
+ }
- private def saveInternal(path: Option[String]): Unit = {
+ private[sql] def saveCommand(path: Option[String]): LogicalPlan = {
+ if (path.isDefined && !df.sparkSession.sessionState.conf.legacyPathOptionBehavior &&
+ extraOptions.contains("path")) {
+ throw QueryCompilationErrors.pathOptionNotSetCorrectlyWhenWritingError()
+ }
if (source.toLowerCase(Locale.ROOT) == DDLUtils.HIVE_PROVIDER) {
throw QueryCompilationErrors.cannotOperateOnHiveDataSourceFilesError("write")
}
@@ -179,23 +185,19 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
// Streaming also uses the data source V2 API. So it may be that the data source
// implements v2, but has no v2 implementation for batch writes. In that case, we
// fall back to saving as though it's a V1 source.
- return saveToV1Source(path)
+ return saveToV1SourceCommand(path)
}
}
val relation = DataSourceV2Relation.create(table, catalog, ident, dsOptions)
checkPartitioningMatchesV2Table(table)
if (curmode == SaveMode.Append) {
- runCommand(df.sparkSession) {
- AppendData.byName(relation, df.logicalPlan, finalOptions)
- }
+ AppendData.byName(relation, df.logicalPlan, finalOptions)
} else {
// Truncate the table. TableCapabilityCheck will throw a nice exception if this
// isn't supported
- runCommand(df.sparkSession) {
- OverwriteByExpression.byName(
- relation, df.logicalPlan, Literal(true), finalOptions)
- }
+ OverwriteByExpression.byName(
+ relation, df.logicalPlan, Literal(true), finalOptions)
}
case createMode =>
@@ -215,16 +217,14 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
serde = None,
external = false,
constraints = Seq.empty)
- runCommand(df.sparkSession) {
- CreateTableAsSelect(
- UnresolvedIdentifier(
- catalog.name +: ident.namespace.toImmutableArraySeq :+ ident.name),
- partitioningAsV2,
- df.queryExecution.analyzed,
- tableSpec,
- finalOptions,
- ignoreIfExists = createMode == SaveMode.Ignore)
- }
+ CreateTableAsSelect(
+ UnresolvedIdentifier(
+ catalog.name +: ident.namespace.toImmutableArraySeq :+ ident.name),
+ partitioningAsV2,
+ df.queryExecution.analyzed,
+ tableSpec,
+ finalOptions,
+ ignoreIfExists = createMode == SaveMode.Ignore)
case _: TableProvider =>
if (getTable.supports(BATCH_WRITE)) {
throw QueryCompilationErrors.writeWithSaveModeUnsupportedBySourceError(
@@ -233,13 +233,13 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
// Streaming also uses the data source V2 API. So it may be that the data source
// implements v2, but has no v2 implementation for batch writes. In that case, we
// fallback to saving as though it's a V1 source.
- saveToV1Source(path)
+ saveToV1SourceCommand(path)
}
}
}
} else {
- saveToV1Source(path)
+ saveToV1SourceCommand(path)
}
}
@@ -251,7 +251,7 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
}
}
- private def saveToV1Source(path: Option[String]): Unit = {
+ private def saveToV1SourceCommand(path: Option[String]): LogicalPlan = {
partitioningColumns.foreach { columns =>
extraOptions = extraOptions + (
DataSourceUtils.PARTITIONING_COLUMNS_KEY ->
@@ -266,13 +266,11 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
val optionsWithPath = getOptionsWithPath(path)
// Code path for data source v1.
- runCommand(df.sparkSession) {
- DataSource(
- sparkSession = df.sparkSession,
- className = source,
- partitionColumns = partitioningColumns.getOrElse(Nil),
- options = optionsWithPath.originalMap).planForWriting(curmode, df.logicalPlan)
- }
+ DataSource(
+ sparkSession = df.sparkSession,
+ className = source,
+ partitionColumns = partitioningColumns.getOrElse(Nil),
+ options = optionsWithPath.originalMap).planForWriting(curmode, df.logicalPlan)
}
/**
@@ -304,6 +302,12 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
* @since 1.4.0
*/
def insertInto(tableName: String): Unit = {
+ runCommand(df.sparkSession) {
+ insertIntoCommand(tableName)
+ }
+ }
+
+ private[sql] def insertIntoCommand(tableName: String): LogicalPlan = {
import df.sparkSession.sessionState.analyzer.{AsTableIdentifier, NonSessionCatalogAndIdentifier, SessionCatalogAndIdentifier}
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
@@ -318,30 +322,30 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
session.sessionState.sqlParser.parseMultipartIdentifier(tableName) match {
case NonSessionCatalogAndIdentifier(catalog, ident) =>
- insertInto(catalog, ident)
+ insertIntoCommand(catalog, ident)
case SessionCatalogAndIdentifier(catalog, ident)
if canUseV2 && ident.namespace().length <= 1 =>
- insertInto(catalog, ident)
+ insertIntoCommand(catalog, ident)
case AsTableIdentifier(tableIdentifier) =>
- insertInto(tableIdentifier)
+ insertIntoCommand(tableIdentifier)
case other =>
throw QueryCompilationErrors.cannotFindCatalogToHandleIdentifierError(other.quoted)
}
}
- private def insertInto(catalog: CatalogPlugin, ident: Identifier): Unit = {
+ private def insertIntoCommand(catalog: CatalogPlugin, ident: Identifier): LogicalPlan = {
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
val table = catalog.asTableCatalog.loadTable(ident, getWritePrivileges.toSet.asJava) match {
case _: V1Table =>
- return insertInto(TableIdentifier(ident.name(), ident.namespace().headOption))
+ return insertIntoCommand(TableIdentifier(ident.name(), ident.namespace().headOption))
case t =>
DataSourceV2Relation.create(t, Some(catalog), Some(ident))
}
- val command = curmode match {
+ curmode match {
case SaveMode.Append | SaveMode.ErrorIfExists | SaveMode.Ignore =>
AppendData.byPosition(table, df.logicalPlan, extraOptions.toMap)
@@ -356,22 +360,16 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
OverwriteByExpression.byPosition(table, df.logicalPlan, Literal(true), extraOptions.toMap)
}
}
-
- runCommand(df.sparkSession) {
- command
- }
}
- private def insertInto(tableIdent: TableIdentifier): Unit = {
- runCommand(df.sparkSession) {
- InsertIntoStatement(
- table = UnresolvedRelation(tableIdent).requireWritePrivileges(getWritePrivileges),
- partitionSpec = Map.empty[String, Option[String]],
- Nil,
- query = df.logicalPlan,
- overwrite = curmode == SaveMode.Overwrite,
- ifPartitionNotExists = false)
- }
+ private def insertIntoCommand(tableIdent: TableIdentifier): LogicalPlan = {
+ InsertIntoStatement(
+ table = UnresolvedRelation(tableIdent).requireWritePrivileges(getWritePrivileges),
+ partitionSpec = Map.empty[String, Option[String]],
+ Nil,
+ query = df.logicalPlan,
+ overwrite = curmode == SaveMode.Overwrite,
+ ifPartitionNotExists = false)
}
private def getWritePrivileges: Seq[TableWritePrivilege] = curmode match {
@@ -430,6 +428,12 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
* @since 1.4.0
*/
def saveAsTable(tableName: String): Unit = {
+ runCommand(df.sparkSession) {
+ saveAsTableCommand(tableName)
+ }
+ }
+
+ private[sql] def saveAsTableCommand(tableName: String): LogicalPlan = {
import df.sparkSession.sessionState.analyzer.{AsTableIdentifier, NonSessionCatalogAndIdentifier, SessionCatalogAndIdentifier}
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
@@ -440,30 +444,29 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
session.sessionState.sqlParser.parseMultipartIdentifier(tableName) match {
case nameParts @ NonSessionCatalogAndIdentifier(catalog, ident) =>
- saveAsTable(catalog.asTableCatalog, ident, nameParts)
+ saveAsTableCommand(catalog.asTableCatalog, ident, nameParts)
case nameParts @ SessionCatalogAndIdentifier(catalog, ident)
if canUseV2 && ident.namespace().length <= 1 =>
- saveAsTable(catalog.asTableCatalog, ident, nameParts)
+ saveAsTableCommand(catalog.asTableCatalog, ident, nameParts)
case AsTableIdentifier(tableIdentifier) =>
- saveAsTable(tableIdentifier)
+ saveAsV1TableCommand(tableIdentifier)
case other =>
throw QueryCompilationErrors.cannotFindCatalogToHandleIdentifierError(other.quoted)
}
}
-
- private def saveAsTable(
- catalog: TableCatalog, ident: Identifier, nameParts: Seq[String]): Unit = {
+ private def saveAsTableCommand(
+ catalog: TableCatalog, ident: Identifier, nameParts: Seq[String]): LogicalPlan = {
val tableOpt = try Option(catalog.loadTable(ident, getWritePrivileges.toSet.asJava)) catch {
case _: NoSuchTableException => None
}
- val command = (curmode, tableOpt) match {
+ (curmode, tableOpt) match {
case (_, Some(_: V1Table)) =>
- return saveAsTable(TableIdentifier(ident.name(), ident.namespace().headOption))
+ saveAsV1TableCommand(TableIdentifier(ident.name(), ident.namespace().headOption))
case (SaveMode.Append, Some(table)) =>
checkPartitioningMatchesV2Table(table)
@@ -512,56 +515,9 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
writeOptions = extraOptions.toMap,
other == SaveMode.Ignore)
}
-
- runCommand(df.sparkSession) {
- command
- }
- }
-
- private def saveAsTable(tableIdent: TableIdentifier): Unit = {
- val catalog = df.sparkSession.sessionState.catalog
- val qualifiedIdent = catalog.qualifyIdentifier(tableIdent)
- val tableExists = catalog.tableExists(qualifiedIdent)
-
- (tableExists, curmode) match {
- case (true, SaveMode.Ignore) =>
- // Do nothing
-
- case (true, SaveMode.ErrorIfExists) =>
- throw QueryCompilationErrors.tableAlreadyExistsError(qualifiedIdent)
-
- case (true, SaveMode.Overwrite) =>
- // Get all input data source or hive relations of the query.
- val srcRelations = df.logicalPlan.collect {
- case l: LogicalRelation => l.relation
- case relation: HiveTableRelation => relation.tableMeta.identifier
- }
-
- val tableRelation = df.sparkSession.table(qualifiedIdent).queryExecution.analyzed
- EliminateSubqueryAliases(tableRelation) match {
- // check if the table is a data source table (the relation is a BaseRelation).
- case l: LogicalRelation if srcRelations.contains(l.relation) =>
- throw QueryCompilationErrors.cannotOverwriteTableThatIsBeingReadFromError(
- qualifiedIdent)
- // check hive table relation when overwrite mode
- case relation: HiveTableRelation
- if srcRelations.contains(relation.tableMeta.identifier) =>
- throw QueryCompilationErrors.cannotOverwriteTableThatIsBeingReadFromError(
- qualifiedIdent)
- case _ => // OK
- }
-
- // Drop the existing table
- catalog.dropTable(qualifiedIdent, ignoreIfNotExists = true, purge = false)
- createTable(qualifiedIdent)
- // Refresh the cache of the table in the catalog.
- catalog.refreshTable(qualifiedIdent)
-
- case _ => createTable(qualifiedIdent)
- }
}
- private def createTable(tableIdent: TableIdentifier): Unit = {
+ private def saveAsV1TableCommand(tableIdent: TableIdentifier): SaveAsV1TableCommand = {
val storage = DataSource.buildStorageFormatFromOptions(extraOptions.toMap)
val tableType = if (storage.locationUri.isDefined) {
CatalogTableType.EXTERNAL
@@ -586,8 +542,7 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
bucketSpec = getBucketSpec,
properties = properties)
- runCommand(df.sparkSession)(
- CreateTable(tableDesc, curmode, Some(df.logicalPlan)))
+ SaveAsV1TableCommand(tableDesc, curmode, df.logicalPlan)
}
/** Converts the provided partitioning and bucketing information to DataSourceV2 Transforms. */
@@ -621,7 +576,8 @@ final class DataFrameWriter[T] private[sql](ds: Dataset[T]) extends sql.DataFram
* user-registered callback functions.
*/
private def runCommand(session: SparkSession)(command: LogicalPlan): Unit = {
- val qe = new QueryExecution(session, command, df.queryExecution.tracker)
+ val qe = new QueryExecution(session, command, df.queryExecution.tracker,
+ shuffleCleanupMode = QueryExecution.determineShuffleCleanupMode(session.sessionState.conf))
qe.assertCommandExecuted()
}
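Editorial sketch for the DataFrameWriter refactor above: each public write method is split into a thin runner plus a private saveCommand/insertIntoCommand/saveAsTableCommand builder that only returns a LogicalPlan, so the plan construction can be reused without executing it, while runCommand now also derives a shuffle cleanup mode from the session conf. A minimal sketch of the build-then-run split follows, using simplified stand-in types rather than Spark's writer API.

object WriterRefactorSketch {
  sealed trait LogicalPlan
  final case class Append(table: String) extends LogicalPlan
  final case class Overwrite(table: String) extends LogicalPlan

  // `run` stands in for runCommand (execution plus cleanup-mode selection).
  final class Writer(table: String, overwrite: Boolean, run: LogicalPlan => Unit) {
    // The public API stays side-effecting and simply delegates to the builder.
    def save(): Unit = run(saveCommand())

    // The builder is pure: it returns the plan without executing it, so other
    // entry points (or tests) can reuse the construction logic directly.
    private[this] def saveCommand(): LogicalPlan =
      if (overwrite) Overwrite(table) else Append(table)
  }
}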
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriterV2.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriterV2.scala
index c6eacfe8f1ed9..7d481b86eb777 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriterV2.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/DataFrameWriterV2.scala
@@ -148,14 +148,17 @@ final class DataFrameWriterV2[T] private[sql](table: String, ds: Dataset[T])
/** @inheritdoc */
override def create(): Unit = {
- runCommand(
- CreateTableAsSelect(
- UnresolvedIdentifier(tableName),
- partitioning.getOrElse(Seq.empty) ++ clustering,
- logicalPlan,
- buildTableSpec(),
- options.toMap,
- false))
+ runCommand(createCommand())
+ }
+
+ private[sql] def createCommand(): LogicalPlan = {
+ CreateTableAsSelect(
+ UnresolvedIdentifier(tableName),
+ partitioning.getOrElse(Seq.empty) ++ clustering,
+ logicalPlan,
+ buildTableSpec(),
+ options.toMap,
+ false)
}
private def buildTableSpec(): UnresolvedTableSpec = {
@@ -186,28 +189,37 @@ final class DataFrameWriterV2[T] private[sql](table: String, ds: Dataset[T])
/** @inheritdoc */
@throws(classOf[NoSuchTableException])
def append(): Unit = {
- val append = AppendData.byName(
+ runCommand(appendCommand())
+ }
+
+ private[sql] def appendCommand(): LogicalPlan = {
+ AppendData.byName(
UnresolvedRelation(tableName).requireWritePrivileges(Seq(INSERT)),
logicalPlan, options.toMap)
- runCommand(append)
}
/** @inheritdoc */
@throws(classOf[NoSuchTableException])
def overwrite(condition: Column): Unit = {
- val overwrite = OverwriteByExpression.byName(
+ runCommand(overwriteCommand(condition))
+ }
+
+ private[sql] def overwriteCommand(condition: Column): LogicalPlan = {
+ OverwriteByExpression.byName(
UnresolvedRelation(tableName).requireWritePrivileges(Seq(INSERT, DELETE)),
logicalPlan, expression(condition), options.toMap)
- runCommand(overwrite)
}
/** @inheritdoc */
@throws(classOf[NoSuchTableException])
def overwritePartitions(): Unit = {
- val dynamicOverwrite = OverwritePartitionsDynamic.byName(
+ runCommand(overwritePartitionsCommand())
+ }
+
+ private[sql] def overwritePartitionsCommand(): LogicalPlan = {
+ OverwritePartitionsDynamic.byName(
UnresolvedRelation(tableName).requireWritePrivileges(Seq(INSERT, DELETE)),
logicalPlan, options.toMap)
- runCommand(dynamicOverwrite)
}
/**
@@ -215,18 +227,24 @@ final class DataFrameWriterV2[T] private[sql](table: String, ds: Dataset[T])
* callback functions.
*/
private def runCommand(command: LogicalPlan): Unit = {
- val qe = new QueryExecution(sparkSession, command, df.queryExecution.tracker)
+ val qe = new QueryExecution(sparkSession, command, df.queryExecution.tracker,
+ shuffleCleanupMode =
+ QueryExecution.determineShuffleCleanupMode(sparkSession.sessionState.conf))
qe.assertCommandExecuted()
}
private def internalReplace(orCreate: Boolean): Unit = {
- runCommand(ReplaceTableAsSelect(
+ runCommand(replaceCommand(orCreate))
+ }
+
+ private[sql] def replaceCommand(orCreate: Boolean): LogicalPlan = {
+ ReplaceTableAsSelect(
UnresolvedIdentifier(tableName),
partitioning.getOrElse(Seq.empty) ++ clustering,
logicalPlan,
buildTableSpec(),
writeOptions = options.toMap,
- orCreate = orCreate))
+ orCreate = orCreate)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/Dataset.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/Dataset.scala
index 8327d81816191..e2688c7ddab12 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/Dataset.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/Dataset.scala
@@ -26,10 +26,9 @@ import scala.reflect.ClassTag
import scala.reflect.runtime.universe.TypeTag
import scala.util.control.NonFatal
-import org.apache.commons.lang3.StringUtils
import org.apache.commons.text.StringEscapeUtils
-import org.apache.spark.{sql, TaskContext}
+import org.apache.spark.{sql, SparkException, TaskContext}
import org.apache.spark.annotation.{DeveloperApi, Stable, Unstable}
import org.apache.spark.api.java.JavaRDD
import org.apache.spark.api.java.function._
@@ -396,15 +395,15 @@ class Dataset[T] private[sql](
val paddedRows = rows.map { row =>
row.zipWithIndex.map { case (cell, i) =>
if (truncate > 0) {
- StringUtils.leftPad(cell, colWidths(i) - Utils.stringHalfWidth(cell) + cell.length)
+ Utils.leftPad(cell, colWidths(i) - Utils.stringHalfWidth(cell) + cell.length)
} else {
- StringUtils.rightPad(cell, colWidths(i) - Utils.stringHalfWidth(cell) + cell.length)
+ Utils.rightPad(cell, colWidths(i) - Utils.stringHalfWidth(cell) + cell.length)
}
}
}
// Create SeparateLine
- val sep: String = colWidths.map("-" * _).addString(sb, "+", "+", "+\n").toString()
+ val sep: String = colWidths.map("-".repeat(_)).addString(sb, "+", "+", "+\n").toString()
// column names
paddedRows.head.addString(sb, "|", "|", "|\n")
@@ -428,13 +427,13 @@ class Dataset[T] private[sql](
dataRows.zipWithIndex.foreach { case (row, i) =>
// "+ 5" in size means a character length except for padded names and data
- val rowHeader = StringUtils.rightPad(
+ val rowHeader = Utils.rightPad(
s"-RECORD $i", fieldNameColWidth + dataColWidth + 5, "-")
sb.append(rowHeader).append("\n")
row.zipWithIndex.map { case (cell, j) =>
- val fieldName = StringUtils.rightPad(fieldNames(j),
+ val fieldName = Utils.rightPad(fieldNames(j),
fieldNameColWidth - Utils.stringHalfWidth(fieldNames(j)) + fieldNames(j).length)
- val data = StringUtils.rightPad(cell,
+ val data = Utils.rightPad(cell,
dataColWidth - Utils.stringHalfWidth(cell) + cell.length)
s" $fieldName | $data "
}.addString(sb, "", "\n", "\n")
@@ -650,7 +649,7 @@ class Dataset[T] private[sql](
private def resolveSelfJoinCondition(
right: Dataset[_],
joinExprs: Option[Column],
- joinType: String): Join = {
+ joinType: String): LogicalPlan = {
// Note that in this function, we introduce a hack in the case of self-join to automatically
// resolve ambiguous join conditions into ones that might make sense [SPARK-6231].
// Consider this case: df.join(df, df("key") === df("key"))
@@ -661,28 +660,40 @@ class Dataset[T] private[sql](
// Trigger analysis so in the case of self-join, the analyzer will clone the plan.
// After the cloning, left and right side will have distinct expression ids.
- val plan = withPlan(
- Join(logicalPlan, right.logicalPlan,
- JoinType(joinType), joinExprs.map(_.expr), JoinHint.NONE))
- .queryExecution.analyzed.asInstanceOf[Join]
+ val planToAnalyze = Join(
+ logicalPlan, right.logicalPlan, JoinType(joinType), joinExprs.map(_.expr), JoinHint.NONE)
+ val analyzedJoinPlan = withPlan(planToAnalyze).queryExecution.analyzed
// If auto self join alias is disabled, return the plan.
if (!sparkSession.sessionState.conf.dataFrameSelfJoinAutoResolveAmbiguity) {
- return plan
+ return analyzedJoinPlan
}
// If left/right have no output set intersection, return the plan.
val lanalyzed = this.queryExecution.analyzed
val ranalyzed = right.queryExecution.analyzed
if (lanalyzed.outputSet.intersect(ranalyzed.outputSet).isEmpty) {
- return plan
+ return analyzedJoinPlan
}
// Otherwise, find the trivially true predicates and automatically resolves them to both sides.
// By the time we get here, since we have already run analysis, all attributes should've been
// resolved and become AttributeReference.
-
- JoinWith.resolveSelfJoinCondition(sparkSession.sessionState.analyzer.resolver, plan)
+ analyzedJoinPlan match {
+ case project @ Project(_, join: Join) =>
+ // SPARK-53143: Handle the edge case where the `AddMetadataColumns` analyzer rule adds a
+ // `Project` node on top of the `Join` node.
+ // Check "SPARK-53143: self join edge-case when Join is not returned by the analyzer" in
+ // `DataframeSelfJoinSuite` for more details.
+ val newProject = project.copy(child = JoinWith.resolveSelfJoinCondition(
+ sparkSession.sessionState.analyzer.resolver, join))
+ newProject.copyTagsFrom(project)
+ newProject
+ case join: Join =>
+ JoinWith.resolveSelfJoinCondition(sparkSession.sessionState.analyzer.resolver, join)
+ case _ => throw SparkException.internalError(
+ s"Unexpected plan type: ${analyzedJoinPlan.getClass.getName} for self join resolution.")
+ }
}
/** @inheritdoc */
@@ -782,28 +793,38 @@ class Dataset[T] private[sql](
tolerance: Column,
allowExactMatches: Boolean,
direction: String): DataFrame = {
- val joined = resolveSelfJoinCondition(other, Option(joinExprs), joinType)
- val leftAsOfExpr = leftAsOf.expr.transformUp {
- case a: AttributeReference if logicalPlan.outputSet.contains(a) =>
- val index = logicalPlan.output.indexWhere(_.exprId == a.exprId)
- joined.left.output(index)
- }
- val rightAsOfExpr = rightAsOf.expr.transformUp {
- case a: AttributeReference if other.logicalPlan.outputSet.contains(a) =>
- val index = other.logicalPlan.output.indexWhere(_.exprId == a.exprId)
- joined.right.output(index)
- }
- withPlan {
+
+ def createAsOfJoinPlan(joinPlan: Join): AsOfJoin = {
+ val leftAsOfExpr = leftAsOf.expr.transformUp {
+ case a: AttributeReference if logicalPlan.outputSet.contains(a) =>
+ val index = logicalPlan.output.indexWhere(_.exprId == a.exprId)
+ joinPlan.left.output(index)
+ }
+ val rightAsOfExpr = rightAsOf.expr.transformUp {
+ case a: AttributeReference if other.logicalPlan.outputSet.contains(a) =>
+ val index = other.logicalPlan.output.indexWhere(_.exprId == a.exprId)
+ joinPlan.right.output(index)
+ }
AsOfJoin(
- joined.left, joined.right,
+ joinPlan.left, joinPlan.right,
leftAsOfExpr, rightAsOfExpr,
- joined.condition,
- joined.joinType,
+ joinPlan.condition,
+ joinPlan.joinType,
Option(tolerance).map(_.expr),
allowExactMatches,
AsOfJoinDirection(direction)
)
}
+
+ resolveSelfJoinCondition(other, Option(joinExprs), joinType) match {
+ case project @ Project(_, join: Join) =>
+ val newProjectPlan = project.copy(child = createAsOfJoinPlan(join))
+ newProjectPlan.copyTagsFrom(project)
+ withPlan { newProjectPlan }
+ case join: Join => withPlan { createAsOfJoinPlan(join) }
+ case plan => throw SparkException.internalError(
+ s"Unexpected plan type: ${plan.getClass.getName} returned from self join resolution.")
+ }
}
/** @inheritdoc */
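Editorial sketch for the Dataset.scala changes above: resolveSelfJoinCondition now returns a LogicalPlan because, per SPARK-53143, the analyzer can hand back the Join wrapped in a Project; callers pattern-match, rewrite the underlying Join, and copy the wrapper (and its tags) back on top. A minimal sketch of rewriting under an optional wrapper follows, with stand-in plan nodes rather than Catalyst's, and tag copying elided.

object SelfJoinRewriteSketch {
  sealed trait Plan
  final case class Join(left: String, right: String, condition: String) extends Plan
  final case class Project(columns: Seq[String], child: Plan) extends Plan

  // Stand-in for JoinWith.resolveSelfJoinCondition: rewrite the join condition.
  private def rewriteJoin(j: Join): Join = j.copy(condition = s"resolved(${j.condition})")

  // Handle both shapes the analyzer can return: a bare Join, or a Project over a Join.
  def rewrite(plan: Plan): Plan = plan match {
    case p @ Project(_, j: Join) => p.copy(child = rewriteJoin(j))
    case j: Join                 => rewriteJoin(j)
    case other =>
      throw new IllegalStateException(s"Unexpected plan: ${other.getClass.getName}")
  }
}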
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/MergeIntoWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/MergeIntoWriter.scala
index 0269b15061c97..e3c872658c86a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/MergeIntoWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/MergeIntoWriter.scala
@@ -57,13 +57,18 @@ class MergeIntoWriter[T] private[sql](table: String, ds: Dataset[T], on: Column)
/** @inheritdoc */
def merge(): Unit = {
+ val qe = sparkSession.sessionState.executePlan(mergeCommand())
+ qe.assertCommandExecuted()
+ }
+
+ private[sql] def mergeCommand(): LogicalPlan = {
if (matchedActions.isEmpty && notMatchedActions.isEmpty && notMatchedBySourceActions.isEmpty) {
throw new SparkRuntimeException(
errorClass = "NO_MERGE_ACTION_SPECIFIED",
messageParameters = Map.empty)
}
- val merge = MergeIntoTable(
+ MergeIntoTable(
UnresolvedRelation(tableName).requireWritePrivileges(MergeIntoTable.getWritePrivileges(
matchedActions, notMatchedActions, notMatchedBySourceActions)),
logicalPlan,
@@ -72,8 +77,6 @@ class MergeIntoWriter[T] private[sql](table: String, ds: Dataset[T], on: Column)
notMatchedActions.toSeq,
notMatchedBySourceActions.toSeq,
schemaEvolutionEnabled)
- val qe = sparkSession.sessionState.executePlan(merge)
- qe.assertCommandExecuted()
}
override protected[sql] def insertAll(condition: Option[Column]): this.type = {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/RelationalGroupedDataset.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/RelationalGroupedDataset.scala
index 0fa6e91e21459..0b1da71be9ede 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/RelationalGroupedDataset.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/RelationalGroupedDataset.scala
@@ -444,8 +444,8 @@ class RelationalGroupedDataset protected[sql](
stateStructType: StructType,
outputModeStr: String,
timeoutConfStr: String): DataFrame = {
- val timeoutConf = org.apache.spark.sql.execution.streaming
- .GroupStateImpl.groupStateTimeoutFromString(timeoutConfStr)
+ val timeoutConf = org.apache.spark.sql.execution.streaming.operators.stateful.
+ flatmapgroupswithstate.GroupStateImpl.groupStateTimeoutFromString(timeoutConfStr)
val outputMode = InternalOutputModes(outputModeStr)
if (outputMode != OutputMode.Append && outputMode != OutputMode.Update) {
throw new IllegalArgumentException("The output mode of function should be append or update")
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/SparkSession.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/SparkSession.scala
index 0015d7ff99e2b..681e1b16af590 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/SparkSession.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/SparkSession.scala
@@ -31,7 +31,7 @@ import scala.util.control.NonFatal
import org.apache.spark.{SPARK_VERSION, SparkConf, SparkContext, SparkException, TaskContext}
import org.apache.spark.annotation.{DeveloperApi, Experimental, Stable, Unstable}
import org.apache.spark.api.java.JavaRDD
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CALL_SITE_LONG_FORM, CLASS_NAME, CONFIG}
import org.apache.spark.internal.config.{ConfigEntry, EXECUTOR_ALLOW_SPARK_CONTEXT}
import org.apache.spark.rdd.RDD
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/classic/StreamingQueryManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/classic/StreamingQueryManager.scala
index 6d4a3ecd36037..0470f3b20ecc8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/classic/StreamingQueryManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/classic/StreamingQueryManager.scala
@@ -25,7 +25,7 @@ import scala.collection.mutable
import scala.jdk.CollectionConverters._
import org.apache.spark.annotation.Evolving
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CLASS_NAME, QUERY_ID, RUN_ID}
import org.apache.spark.sql.catalyst.catalog.CatalogTable
import org.apache.spark.sql.catalyst.streaming.{WriteToStream, WriteToStreamStatement}
@@ -33,6 +33,7 @@ import org.apache.spark.sql.connector.catalog.{Identifier, SupportsWrite, Table,
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.streaming._
import org.apache.spark.sql.execution.streaming.continuous.ContinuousExecution
+import org.apache.spark.sql.execution.streaming.runtime.{AsyncProgressTrackingMicroBatchExecution, MicroBatchExecution, StreamingQueryListenerBus, StreamingQueryWrapper}
import org.apache.spark.sql.execution.streaming.state.StateStoreCoordinatorRef
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.StaticSQLConf.STREAMING_QUERY_LISTENERS
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/columnar/CachedBatchSerializer.scala b/sql/core/src/main/scala/org/apache/spark/sql/columnar/CachedBatchSerializer.scala
index 885ddf4110cbb..2f1b79ec90f99 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/columnar/CachedBatchSerializer.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/columnar/CachedBatchSerializer.scala
@@ -18,12 +18,14 @@
package org.apache.spark.sql.columnar
import org.apache.spark.annotation.{DeveloperApi, Since}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{FILTER, PREDICATE}
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.dsl.expressions._
import org.apache.spark.sql.catalyst.expressions.{And, Attribute, AttributeReference, BindReferences, EqualNullSafe, EqualTo, Expression, GreaterThan, GreaterThanOrEqual, In, IsNotNull, IsNull, Length, LessThan, LessThanOrEqual, Literal, Or, Predicate, StartsWith}
+import org.apache.spark.sql.execution.{ColumnarToRowTransition, InputAdapter, SparkPlan, WholeStageCodegenExec}
+import org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanExec
import org.apache.spark.sql.execution.columnar.{ColumnStatisticsSchema, PartitionStatistics}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.{AtomicType, BinaryType, StructType}
@@ -58,6 +60,40 @@ trait CachedBatchSerializer extends Serializable {
*/
def supportsColumnarInput(schema: Seq[Attribute]): Boolean
+ /**
+ * Attempt to convert a query plan to its columnar equivalent for columnar caching.
+ * Called on the query plan that is about to be cached once [[supportsColumnarInput]] returns
+ * true on its output schema.
+ *
+ * The default implementation works by stripping the topmost columnar-to-row transition to
+ * expose the columnar-based plan to the serializer.
+ *
+ * @param plan The plan to convert.
+ * @return The output plan: either a columnar plan if the input plan is convertible, or the
+ * input plan unchanged if no viable conversion can be done.
+ */
+ @DeveloperApi
+ @Since("4.1.0")
+ def convertToColumnarPlanIfPossible(plan: SparkPlan): SparkPlan = plan match {
+ case gen: WholeStageCodegenExec =>
+ gen.child match {
+ case c2r: ColumnarToRowTransition =>
+ c2r.child match {
+ case ia: InputAdapter => ia.child
+ case _ => plan
+ }
+ case _ => plan
+ }
+ case c2r: ColumnarToRowTransition => // This matches when whole stage code gen is disabled.
+ c2r.child
+ case adaptive: AdaptiveSparkPlanExec =>
+ // If AQE is enabled for the cached plan and the table cache supports columnar input, mark
+ // `AdaptiveSparkPlanExec.supportsColumnar` as true to avoid inserting `ColumnarToRow`, so
+ // that `CachedBatchSerializer` can use `convertColumnarBatchToCachedBatch` to cache data.
+ adaptive.copy(supportsColumnar = true)
+ case _ => plan
+ }
+
/**
* Convert an `RDD[InternalRow]` into an `RDD[CachedBatch]` in preparation for caching the data.
* @param input the input `RDD` to be converted.
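Editorial sketch for convertToColumnarPlanIfPossible above: the default implementation exposes the columnar subtree by peeling the topmost columnar-to-row transition, optionally nested under whole-stage codegen, and otherwise returns the plan unchanged (the AQE branch flips supportsColumnar instead). A minimal sketch of the strip-the-wrapper-if-it-matches shape follows, with stand-in node types rather than Spark's SparkPlan hierarchy, and the InputAdapter/AQE cases elided.

object StripTransitionSketch {
  sealed trait Plan
  case object ColumnarScan extends Plan
  final case class ColumnarToRow(child: Plan) extends Plan
  final case class WholeStageCodegen(child: Plan) extends Plan

  // Peel the topmost to-row transition (possibly under whole-stage codegen) to
  // expose the columnar subtree; otherwise return the plan unchanged.
  def toColumnarIfPossible(plan: Plan): Plan = plan match {
    case WholeStageCodegen(ColumnarToRow(inner)) => inner
    case ColumnarToRow(inner)                    => inner
    case other                                   => other
  }
}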
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/BaseScriptTransformationExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/BaseScriptTransformationExec.scala
index 60156bff1fb71..bfd813ad5ef11 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/BaseScriptTransformationExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/BaseScriptTransformationExec.scala
@@ -27,7 +27,7 @@ import scala.util.control.NonFatal
import org.apache.hadoop.conf.Configuration
import org.apache.spark.{SparkFiles, TaskContext}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.{CatalystTypeConverters, InternalRow}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/CacheManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/CacheManager.scala
index 5b68be2c4ce55..a8292a8dbaa3b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/CacheManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/CacheManager.scala
@@ -19,7 +19,7 @@ package org.apache.spark.sql.execution
import org.apache.hadoop.fs.{FileSystem, Path}
-import org.apache.spark.internal.{Logging, MDC, MessageWithContext}
+import org.apache.spark.internal.{Logging, MessageWithContext}
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.catalyst.catalog.HiveTableRelation
import org.apache.spark.sql.catalyst.expressions.{Attribute, SubqueryExpression}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/Columnar.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/Columnar.scala
index 4c9ae155ec17a..f9193cd0495f6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/Columnar.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/Columnar.scala
@@ -32,7 +32,6 @@ import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
import org.apache.spark.sql.execution.vectorized.WritableColumnVector
import org.apache.spark.sql.types._
import org.apache.spark.sql.vectorized.{ColumnarBatch, ColumnVector}
-import org.apache.spark.util.Utils
/**
* Holds a user defined rule that can be used to inject columnar implementations of various
@@ -66,9 +65,6 @@ trait ColumnarToRowTransition extends UnaryExecNode
* [[MapPartitionsInRWithArrowExec]]. Eventually this should replace those implementations.
*/
case class ColumnarToRowExec(child: SparkPlan) extends ColumnarToRowTransition with CodegenSupport {
- // supportsColumnar requires to be only called on driver side, see also SPARK-37779.
- assert(Utils.isInRunningSparkTask || child.supportsColumnar)
-
override def output: Seq[Attribute] = child.output
override def outputPartitioning: Partitioning = child.outputPartitioning
@@ -500,33 +496,31 @@ case class ApplyColumnarRulesAndInsertTransitions(
extends Rule[SparkPlan] {
/**
- * Inserts an transition to columnar formatted data.
+ * Ensures columnar output on the input query plan. Transitions will be inserted
+ * on demand.
*/
- private def insertRowToColumnar(plan: SparkPlan): SparkPlan = {
+ private def ensureOutputsColumnar(plan: SparkPlan): SparkPlan = {
if (!plan.supportsColumnar) {
// The tree feels kind of backwards
// Columnar Processing will start here, so transition from row to columnar
- RowToColumnarExec(insertTransitions(plan, outputsColumnar = false))
+ RowToColumnarExec(ensureOutputsRowBased(plan))
} else if (!plan.isInstanceOf[RowToColumnarTransition]) {
- plan.withNewChildren(plan.children.map(insertRowToColumnar))
+ plan.withNewChildren(plan.children.map(ensureOutputsColumnar))
} else {
plan
}
}
/**
- * Inserts RowToColumnarExecs and ColumnarToRowExecs where needed.
+ * Ensures row-based output on the input query plan. Transitions will be inserted
+ * on demand.
*/
- private def insertTransitions(plan: SparkPlan, outputsColumnar: Boolean): SparkPlan = {
- if (outputsColumnar) {
- insertRowToColumnar(plan)
- } else if (plan.supportsColumnar && !plan.supportsRowBased) {
+ private def ensureOutputsRowBased(plan: SparkPlan): SparkPlan = {
+ if (plan.supportsColumnar && !plan.supportsRowBased) {
// `outputsColumnar` is false but the plan only outputs columnar format, so add a
// to-row transition here.
- ColumnarToRowExec(insertRowToColumnar(plan))
- } else if (plan.isInstanceOf[ColumnarToRowTransition]) {
- plan
- } else {
+ ColumnarToRowExec(ensureOutputsColumnar(plan))
+ } else if (!plan.isInstanceOf[ColumnarToRowTransition]) {
val outputsColumnar = plan match {
// With planned write, the write command invokes child plan's `executeWrite` which is
// neither columnar nor row-based.
@@ -541,6 +535,19 @@ case class ApplyColumnarRulesAndInsertTransitions(
false
}
plan.withNewChildren(plan.children.map(insertTransitions(_, outputsColumnar)))
+ } else {
+ plan
+ }
+ }
+
+ /**
+ * Inserts RowToColumnarExecs and ColumnarToRowExecs where needed.
+ */
+ private def insertTransitions(plan: SparkPlan, outputsColumnar: Boolean): SparkPlan = {
+ if (outputsColumnar) {
+ ensureOutputsColumnar(plan)
+ } else {
+ ensureOutputsRowBased(plan)
}
}
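Editorial sketch for the restructured rule above: insertTransitions becomes a dispatcher over two mutually recursive helpers, where ensureOutputsColumnar wraps row-producing subtrees in a row-to-columnar transition, ensureOutputsRowBased wraps columnar-only subtrees in a columnar-to-row transition, and both recurse into children otherwise. The sketch below models that mutual recursion over stand-in plan nodes; the real rule's supportsRowBased and planned-write handling is deliberately elided.

object TransitionSketch {
  sealed trait Node { def columnar: Boolean; def children: Seq[Node] }
  final case class Leaf(columnar: Boolean) extends Node { val children: Seq[Node] = Nil }
  final case class RowToColumnar(child: Node) extends Node {
    val columnar: Boolean = true
    val children: Seq[Node] = Seq(child)
  }
  final case class ColumnarToRow(child: Node) extends Node {
    val columnar: Boolean = false
    val children: Seq[Node] = Seq(child)
  }
  final case class Op(columnar: Boolean, children: Seq[Node]) extends Node

  // Wrap row-producing subtrees so the output is columnar; recurse otherwise.
  def ensureOutputsColumnar(n: Node): Node =
    if (!n.columnar) RowToColumnar(ensureOutputsRowBased(n))
    else n match {
      case Op(c, kids) => Op(c, kids.map(ensureOutputsColumnar))
      case other       => other
    }

  // Wrap columnar-only subtrees so the output is row-based; recurse otherwise.
  def ensureOutputsRowBased(n: Node): Node =
    if (n.columnar) ColumnarToRow(ensureOutputsColumnar(n))
    else n match {
      case Op(c, kids) => Op(c, kids.map(ensureOutputsRowBased))
      case other       => other
    }

  // The entry point only picks a direction, as in the refactored rule.
  def insertTransitions(n: Node, outputsColumnar: Boolean): Node =
    if (outputsColumnar) ensureOutputsColumnar(n) else ensureOutputsRowBased(n)
}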
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
index 31ab367c2d003..66e07aa4f7d44 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
@@ -19,11 +19,9 @@ package org.apache.spark.sql.execution
import java.util.concurrent.TimeUnit._
-import org.apache.commons.lang3.StringUtils
import org.apache.hadoop.fs.Path
import org.apache.spark.internal.LogKeys.{COUNT, MAX_SPLIT_BYTES, OPEN_COST_IN_BYTES}
-import org.apache.spark.internal.MDC
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.{FileSourceOptions, InternalRow, TableIdentifier}
import org.apache.spark.sql.catalyst.catalog.BucketSpec
@@ -36,7 +34,7 @@ import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution
import org.apache.spark.sql.execution.datasources._
import org.apache.spark.sql.execution.datasources.parquet.{ParquetFileFormat => ParquetSource}
-import org.apache.spark.sql.execution.datasources.v2.PushedDownOperators
+import org.apache.spark.sql.execution.datasources.v2.{PushedDownOperators, TableSampleInfo}
import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
import org.apache.spark.sql.execution.vectorized.ConstantColumnVector
import org.apache.spark.sql.internal.SQLConf
@@ -65,7 +63,7 @@ trait DataSourceScanExec extends LeafExecNode with StreamSourceAwareSparkPlan {
override def simpleString(maxFields: Int): String = {
val metadataEntries = metadata.toSeq.sorted.map {
case (key, value) =>
- key + ": " + StringUtils.abbreviate(redact(value), maxMetadataValueLength)
+ key + ": " + Utils.abbreviate(redact(value), maxMetadataValueLength)
}
val metadataStr = truncatedString(metadataEntries, " ", ", ", "", maxFields)
redact(
@@ -159,10 +157,12 @@ case class RowDataSourceScanExec(
override def inputRDD: RDD[InternalRow] = rdd
- override val metadata: Map[String, String] = {
+ private def seqToString(seq: Seq[Any]): String = seq.mkString("[", ", ", "]")
- def seqToString(seq: Seq[Any]): String = seq.mkString("[", ", ", "]")
+ private def pushedSampleMetadataString(s: TableSampleInfo): String =
+ s"SAMPLE (${(s.upperBound - s.lowerBound) * 100}) ${s.withReplacement} SEED(${s.seed})"
+ override val metadata: Map[String, String] = {
val markedFilters = if (filters.nonEmpty) {
for (filter <- filters) yield {
if (handledFilters.contains(filter)) s"*$filter" else s"$filter"
@@ -189,6 +189,15 @@ case class RowDataSourceScanExec(
seqToString(markedFilters.toSeq)
}
+ val pushedJoins = if (pushedDownOperators.joinedRelationPushedDownOperators.nonEmpty) {
+ Map("PushedJoins" ->
+ s"\n${getPushedJoinString(
+ pushedDownOperators.joinedRelationPushedDownOperators(0),
+ pushedDownOperators.joinedRelationPushedDownOperators(1))}\n")
+ } else {
+ Map()
+ }
+
Map("ReadSchema" -> requiredSchema.catalogString,
"PushedFilters" -> pushedFilters) ++
pushedDownOperators.aggregation.fold(Map[String, String]()) { v =>
@@ -198,9 +207,78 @@ case class RowDataSourceScanExec(
seqToString(v.groupByExpressions.map(_.describe()).toImmutableArraySeq))} ++
topNOrLimitInfo ++
offsetInfo ++
- pushedDownOperators.sample.map(v => "PushedSample" ->
- s"SAMPLE (${(v.upperBound - v.lowerBound) * 100}) ${v.withReplacement} SEED(${v.seed})"
- )
+ pushedDownOperators.sample.map(v => "PushedSample" -> pushedSampleMetadataString(v)) ++
+ pushedJoins
+ }
+
+ /**
+ * Build string for all the pushed down join operators. The method is recursive, so if there is
+ * join on top of 2 already joined relations, all of these will be present in string.
+ *
+ * An example of the resulting string is the following:
+ *
+ * PushedFilters: [id_3 = (id_4 + 1)], PushedJoins:
+ * [L]: PushedFilters: [ID_1 = (id_3 + 1)]
+ * PushedJoins:
+ * [L]: PushedFilters: [ID = (ID_1 + 1)]
+ * PushedJoins:
+ * [L]: Relation: join_pushdown_catalog.JOIN_SCHEMA.JOIN_TABLE_1
+ * PushedFilters: [ID IS NOT NULL]
+ * [R]: Relation: join_pushdown_catalog.JOIN_SCHEMA.JOIN_TABLE_2
+ * PushedFilters: [ID IS NOT NULL]
+ * [R]: Relation: join_pushdown_catalog.JOIN_SCHEMA.JOIN_TABLE_3
+ * PushedFilters: [id IS NOT NULL]
+ * [R]: Relation: join_pushdown_catalog.JOIN_SCHEMA.JOIN_TABLE_4
+ * PushedFilters: [id IS NOT NULL]
+ */
+ private def getPushedJoinString(
+ leftSidePushedDownOperators: PushedDownOperators,
+ rightSidePushedDownOperators: PushedDownOperators,
+ indent: Int = 0): String = {
+ val indentStr = " ".repeat(indent)
+
+ val leftSideOperators = buildOperatorParts(leftSidePushedDownOperators, indent)
+ val leftSideMetadataStr = formatMetadata(leftSideOperators, indentStr + " ".repeat(5))
+
+ val rightSideOperators = buildOperatorParts(rightSidePushedDownOperators, indent)
+ val rightSideMetadataStr = formatMetadata(rightSideOperators, indentStr + " ".repeat(5))
+
+ val leftSideString = s"$indentStr[L]: $leftSideMetadataStr"
+ val rightSideString = s"$indentStr[R]: $rightSideMetadataStr"
+ Seq(leftSideString, rightSideString).mkString("\n")
+ }
+
+ private def buildOperatorParts(operators: PushedDownOperators, indent: Int): List[String] = {
+ val parts = List.newBuilder[String]
+
+ // Add relation name for leaf nodes (nodes without further joins)
+ if (operators.joinedRelationPushedDownOperators.isEmpty) {
+ operators.relationName.foreach(name => parts += s"Relation: $name")
+ }
+
+ if (operators.pushedPredicates.nonEmpty) {
+ parts += s"PushedFilters: ${seqToString(operators.pushedPredicates.map(_.describe()))}"
+ }
+
+ operators.sample.foreach { sample =>
+ parts += s"PushedSample: ${pushedSampleMetadataString(sample)}"
+ }
+
+ // Recursively build the pushed join string for the joined children with correct indentation.
+ if (operators.joinedRelationPushedDownOperators.nonEmpty) {
+ val nestedJoins = getPushedJoinString(
+ operators.joinedRelationPushedDownOperators(0),
+ operators.joinedRelationPushedDownOperators(1),
+ indent + 5)
+ parts += s"PushedJoins:\n$nestedJoins"
+ }
+
+ parts.result()
+ }
+
+ private def formatMetadata(parts: List[String], indentStr: String): String = {
+ val (basicParts, nestedJoinsParts) = parts.partition(!_.startsWith("PushedJoins:"))
+ (basicParts ++ nestedJoinsParts).mkString("\n" + indentStr)
}
// Don't care about `rdd` and `tableIdentifier`, and `stream` when canonicalizing.
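Editorial sketch for getPushedJoinString above: the pushed-down join tree is rendered recursively, with an [L] and an [R] block per level, relation names printed at the leaves, pushed filters printed at every level, and nested joins indented by five spaces. A minimal sketch of the same recursive, indentation-based formatter follows over a stand-in tree; the real PushedDownOperators fields (sample, relation name options, etc.) are simplified away.

object PushedJoinStringSketch {
  sealed trait Node
  final case class Relation(name: String, filters: Seq[String]) extends Node
  final case class Joined(left: Node, right: Node, filters: Seq[String]) extends Node

  private def filterStr(fs: Seq[String]): String = fs.mkString("[", ", ", "]")

  // Render one level of the join tree: an [L] block and an [R] block,
  // nesting further joins with five extra spaces of indentation.
  def render(left: Node, right: Node, indent: Int = 0): String = {
    val pad = " ".repeat(indent)
    val inner = pad + " ".repeat(5)
    def side(tag: String, n: Node): String = n match {
      case Relation(name, fs) =>
        s"$pad[$tag]: Relation: $name\n${inner}PushedFilters: ${filterStr(fs)}"
      case Joined(l, r, fs) =>
        s"$pad[$tag]: PushedFilters: ${filterStr(fs)}\n${inner}PushedJoins:\n" +
          render(l, r, indent + 5)
    }
    side("L", left) + "\n" + side("R", right)
  }
}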
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/EmptyRelationExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/EmptyRelationExec.scala
index a0c3d7b51c2c3..70c9e5359e2ab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/EmptyRelationExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/EmptyRelationExec.scala
@@ -61,6 +61,7 @@ case class EmptyRelationExec(@transient logical: LogicalPlan) extends LeafExecNo
addSuffix: Boolean = false,
maxFields: Int,
printNodeId: Boolean,
+ printOutputColumns: Boolean,
indent: Int = 0): Unit = {
super.generateTreeString(depth,
lastChildren,
@@ -70,11 +71,13 @@ case class EmptyRelationExec(@transient logical: LogicalPlan) extends LeafExecNo
addSuffix,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
Option(logical).foreach { _ =>
lastChildren.add(true)
logical.generateTreeString(
- depth + 1, lastChildren, append, verbose, "", false, maxFields, printNodeId, indent)
+ depth + 1, lastChildren, append, verbose, "", false, maxFields, printNodeId,
+ printOutputColumns, indent)
lastChildren.remove(lastChildren.size() - 1)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/ExistingRDD.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/ExistingRDD.scala
index 6000b3c20251e..6148fb30783e8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/ExistingRDD.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/ExistingRDD.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.execution
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{LOGICAL_PLAN_COLUMNS, OPTIMIZED_PLAN_COLUMNS}
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.Encoder
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/ExternalAppendOnlyUnsafeRowArray.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/ExternalAppendOnlyUnsafeRowArray.scala
index 59810adc4b22e..3e98c28b29fbc 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/ExternalAppendOnlyUnsafeRowArray.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/ExternalAppendOnlyUnsafeRowArray.scala
@@ -22,7 +22,7 @@ import java.io.Closeable
import scala.collection.mutable.ArrayBuffer
import org.apache.spark.{SparkEnv, TaskContext}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CLASS_NAME, MAX_NUM_ROWS_IN_MEMORY_BUFFER}
import org.apache.spark.memory.TaskMemoryManager
import org.apache.spark.serializer.SerializerManager
@@ -52,9 +52,12 @@ private[sql] class ExternalAppendOnlyUnsafeRowArray(
initialSize: Int,
pageSizeBytes: Long,
numRowsInMemoryBufferThreshold: Int,
- numRowsSpillThreshold: Int) extends Logging {
+ numRowsSpillThreshold: Int,
+ maxSizeSpillThreshold: Long) extends Logging {
- def this(numRowsInMemoryBufferThreshold: Int, numRowsSpillThreshold: Int) = {
+ def this(numRowsInMemoryBufferThreshold: Int,
+ numRowsSpillThreshold: Int,
+ maxSizeSpillThreshold: Long) = {
this(
TaskContext.get().taskMemoryManager(),
SparkEnv.get.blockManager,
@@ -63,7 +66,8 @@ private[sql] class ExternalAppendOnlyUnsafeRowArray(
1024,
SparkEnv.get.memoryManager.pageSizeBytes,
numRowsInMemoryBufferThreshold,
- numRowsSpillThreshold)
+ numRowsSpillThreshold,
+ maxSizeSpillThreshold)
}
private val initialSizeOfInMemoryBuffer =
@@ -138,6 +142,7 @@ private[sql] class ExternalAppendOnlyUnsafeRowArray(
initialSize,
pageSizeBytes,
numRowsSpillThreshold,
+ maxSizeSpillThreshold,
false)
// populate with existing in-memory buffered rows
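
A simplified, hypothetical sketch (plain Scala, not Spark's ExternalAppendOnlyUnsafeRowArray) of the spill policy the new maxSizeSpillThreshold parameter adds alongside numRowsSpillThreshold: the buffer falls back to a spillable structure once either the buffered row count or the accumulated byte size crosses its threshold.

    final class BoundedRowBuffer(numRowsSpillThreshold: Int, maxSizeSpillThreshold: Long) {
      private var numRows = 0
      private var totalBytes = 0L

      // Returns true if appending a row of `rowSizeBytes` should first trigger a spill.
      def shouldSpill(rowSizeBytes: Long): Boolean =
        numRows + 1 > numRowsSpillThreshold || totalBytes + rowSizeBytes > maxSizeSpillThreshold

      def add(rowSizeBytes: Long): Unit = {
        numRows += 1
        totalBytes += rowSizeBytes
      }
    }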
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/HiveResult.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/HiveResult.scala
index 21cf70dab59f7..3a7b75a555af1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/HiveResult.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/HiveResult.scala
@@ -149,6 +149,6 @@ object HiveResult extends SQLConfHelper {
startField,
endField)
case (v: VariantVal, VariantType) => v.toString
- case (other, _: UserDefinedType[_]) => other.toString
+ case (other, u: UserDefinedType[_]) => u.stringifyValue(other)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/KeyGroupedPartitionedScan.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/KeyGroupedPartitionedScan.scala
new file mode 100644
index 0000000000000..5a789179219ad
--- /dev/null
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/KeyGroupedPartitionedScan.scala
@@ -0,0 +1,176 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution
+
+import org.apache.spark.sql.catalyst.InternalRow
+import org.apache.spark.sql.catalyst.expressions.RowOrdering
+import org.apache.spark.sql.catalyst.plans.physical.{KeyGroupedPartitioning, KeyGroupedShuffleSpec}
+import org.apache.spark.sql.catalyst.util.InternalRowComparableWrapper
+import org.apache.spark.sql.execution.joins.StoragePartitionJoinParams
+
+/** Base trait for a data source scan capable of producing a key-grouped output. */
+trait KeyGroupedPartitionedScan[T] {
+ /**
+ * The output partitioning of this scan after applying any pushed-down SPJ parameters.
+ *
+ * @param basePartitioning The original key-grouped partitioning of the scan.
+ * @param spjParams SPJ parameters for the scan.
+ */
+ def getOutputKeyGroupedPartitioning(
+ basePartitioning: KeyGroupedPartitioning,
+ spjParams: StoragePartitionJoinParams): KeyGroupedPartitioning = {
+ val expressions = spjParams.joinKeyPositions match {
+ case Some(projectionPositions) =>
+ projectionPositions.map(i => basePartitioning.expressions(i))
+ case _ => basePartitioning.expressions
+ }
+
+ val newPartValues = spjParams.commonPartitionValues match {
+ case Some(commonPartValues) =>
+ // We allow duplicated partition values if
+ // `spark.sql.sources.v2.bucketing.partiallyClusteredDistribution.enabled` is true
+ commonPartValues.flatMap {
+ case (partValue, numSplits) => Seq.fill(numSplits)(partValue)
+ }
+ case None =>
+ spjParams.joinKeyPositions match {
+ case Some(projectionPositions) => basePartitioning.partitionValues.map { r =>
+ val projectedRow = KeyGroupedPartitioning.project(expressions,
+ projectionPositions, r)
+ InternalRowComparableWrapper(projectedRow, expressions)
+ }.distinct.map(_.row)
+ case _ => basePartitioning.partitionValues
+ }
+ }
+ basePartitioning.copy(expressions = expressions, numPartitions = newPartValues.length,
+ partitionValues = newPartValues)
+ }
+
+ /**
+ * Re-groups the input partitions for this scan based on the provided SPJ params, returning a list
+ * of partitions to be scanned by each scan task.
+ *
+ * @param p The output KeyGroupedPartitioning of this scan.
+ * @param spjParams SPJ parameters for the scan.
+ * @param filteredPartitions The input partitions (after applying filtering) to be
+ * re-grouped for this scan, initially grouped by partition value.
+ * @param partitionValueAccessor Accessor for the partition values (as an [[InternalRow]])
+ */
+ def getInputPartitionGrouping(
+ p: KeyGroupedPartitioning,
+ spjParams: StoragePartitionJoinParams,
+ filteredPartitions: Seq[Seq[T]],
+ partitionValueAccessor: T => InternalRow): Seq[Seq[T]] = {
+ assert(spjParams.keyGroupedPartitioning.isDefined)
+ val expressions = spjParams.keyGroupedPartitioning.get
+
+ // Re-group the input partitions if we are projecting on a subset of join keys
+ val (groupedPartitions, partExpressions) = spjParams.joinKeyPositions match {
+ case Some(projectPositions) =>
+ val projectedExpressions = projectPositions.map(i => expressions(i))
+ val parts = filteredPartitions.flatten.groupBy(part => {
+ val row = partitionValueAccessor(part)
+ val projectedRow = KeyGroupedPartitioning.project(
+ expressions, projectPositions, row)
+ InternalRowComparableWrapper(projectedRow, projectedExpressions)
+ }).map { case (wrapper, splits) => (wrapper.row, splits) }.toSeq
+ (parts, projectedExpressions)
+ case _ =>
+ val groupedParts = filteredPartitions.map(splits => {
+ assert(splits.nonEmpty)
+ (partitionValueAccessor(splits.head), splits)
+ })
+ (groupedParts, expressions)
+ }
+
+ // Also re-group the partitions if we are reducing compatible partition expressions
+ val finalGroupedPartitions = spjParams.reducers match {
+ case Some(reducers) =>
+ val result = groupedPartitions.groupBy { case (row, _) =>
+ KeyGroupedShuffleSpec.reducePartitionValue(row, partExpressions, reducers)
+ }.map { case (wrapper, splits) => (wrapper.row, splits.flatMap(_._2)) }.toSeq
+ val rowOrdering = RowOrdering.createNaturalAscendingOrdering(
+ partExpressions.map(_.dataType))
+ result.sorted(rowOrdering.on((t: (InternalRow, _)) => t._1))
+ case _ => groupedPartitions
+ }
+
+ // When partially clustered, the input partitions are not grouped by partition
+ // values. Here we'll need to check `commonPartitionValues` and decide how to group
+ // and replicate splits within a partition.
+ if (spjParams.commonPartitionValues.isDefined && spjParams.applyPartialClustering) {
+ // A mapping from the common partition values to how many splits the partition
+ // should contain.
+ val commonPartValuesMap = spjParams.commonPartitionValues
+ .get
+ .map(t => (InternalRowComparableWrapper(t._1, partExpressions), t._2))
+ .toMap
+ val filteredGroupedPartitions = finalGroupedPartitions.filter {
+ case (partValues, _) =>
+ commonPartValuesMap.keySet.contains(
+ InternalRowComparableWrapper(partValues, partExpressions))
+ }
+ val nestGroupedPartitions = filteredGroupedPartitions.map { case (partValue, splits) =>
+ // `commonPartValuesMap` should contain the part value since it's the superset.
+ val numSplits = commonPartValuesMap
+ .get(InternalRowComparableWrapper(partValue, partExpressions))
+ assert(numSplits.isDefined, s"Partition value $partValue does not exist in " +
+ "common partition values from Spark plan")
+
+ val newSplits = if (spjParams.replicatePartitions) {
+ // We need to also replicate partitions according to the other side of join
+ Seq.fill(numSplits.get)(splits)
+ } else {
+ // Not grouping by partition values: this could be the side with partially
+ // clustered distribution. Because of dynamic filtering, we'll need to check if
+ // the final number of splits of a partition is smaller than the original
+ // number, and fill with empty splits if so. This is necessary so that both
+ // sides of a join will have the same number of partitions & splits.
+ splits.map(Seq(_)).padTo(numSplits.get, Seq.empty)
+ }
+ (InternalRowComparableWrapper(partValue, partExpressions), newSplits)
+ }
+
+ // Now fill missing partition keys with empty partitions
+ val partitionMapping = nestGroupedPartitions.toMap
+ spjParams.commonPartitionValues.get.flatMap {
+ case (partValue, numSplits) =>
+ // Use empty partition for those partition values that are not present.
+ partitionMapping.getOrElse(
+ InternalRowComparableWrapper(partValue, partExpressions),
+ Seq.fill(numSplits)(Seq.empty))
+ }
+ } else {
+ // either `commonPartitionValues` is not defined, or it is defined but
+ // `applyPartialClustering` is false.
+ val partitionMapping = finalGroupedPartitions.map { case (partValue, splits) =>
+ InternalRowComparableWrapper(partValue, partExpressions) -> splits
+ }.toMap
+
+ // In case `commonPartitionValues` is not defined (e.g., SPJ is not used), there
+ // could exist duplicated partition values, as partition grouping is not done
+ // at the beginning and postponed to this method. It is important to use unique
+ // partition values here so that grouped partitions won't get duplicated.
+ p.uniquePartitionValues.map { partValue =>
+ // Use empty partition for those partition values that are not present
+ partitionMapping.getOrElse(
+ InternalRowComparableWrapper(partValue, partExpressions), Seq.empty)
+ }
+ }
+ }
+}
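
A self-contained sketch (plain Scala, hypothetical alignSplits helper) of the replicate-or-pad step used above for partially clustered distribution: for each common partition value, the side that replicates repeats all of its splits numSplits times, while the other side wraps each split individually and pads with empty splits, so both join sides end up with the same number of partitions and splits.

    def alignSplits(splits: Seq[String], numSplits: Int, replicate: Boolean): Seq[Seq[String]] =
      if (replicate) {
        // Replicate the whole split set to match the other side of the join.
        Seq.fill(numSplits)(splits)
      } else {
        // One split per group, padded with empty groups up to the common count.
        splits.map(Seq(_)).padTo(numSplits, Seq.empty[String])
      }

    // alignSplits(Seq("s1", "s2"), 3, replicate = true)  => three copies of Seq("s1", "s2")
    // alignSplits(Seq("s1", "s2"), 3, replicate = false) => Seq(Seq("s1"), Seq("s2"), Seq())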
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/QueryExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/QueryExecution.scala
index 9e5264d8d4f31..9f59bded94fe1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/QueryExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/QueryExecution.scala
@@ -26,7 +26,7 @@ import scala.util.control.NonFatal
import org.apache.hadoop.fs.Path
import org.apache.spark.SparkException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.EXTENDED_EXPLAIN_GENERATOR
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.{AnalysisException, ExtendedExplainGenerator, Row}
@@ -44,7 +44,8 @@ import org.apache.spark.sql.execution.bucketing.{CoalesceBucketsInJoin, DisableU
import org.apache.spark.sql.execution.dynamicpruning.PlanDynamicPruningFilters
import org.apache.spark.sql.execution.exchange.EnsureRequirements
import org.apache.spark.sql.execution.reuse.ReuseExchangeAndSubquery
-import org.apache.spark.sql.execution.streaming.{IncrementalExecution, OffsetSeqMetadata, WatermarkPropagator}
+import org.apache.spark.sql.execution.streaming.checkpointing.OffsetSeqMetadata
+import org.apache.spark.sql.execution.streaming.runtime.{IncrementalExecution, WatermarkPropagator}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.scripting.SqlScriptingExecution
import org.apache.spark.sql.streaming.OutputMode
@@ -683,4 +684,12 @@ object QueryExecution {
normalized
}
}
+
+ def determineShuffleCleanupMode(conf: SQLConf): ShuffleCleanupMode = {
+ if (conf.getConf(SQLConf.CLASSIC_SHUFFLE_DEPENDENCY_FILE_CLEANUP_ENABLED)) {
+ RemoveShuffleFiles
+ } else {
+ DoNotCleanup
+ }
+ }
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/SQLExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/SQLExecution.scala
index 9dcb38f8ff10e..c5c2f9bb6a6f6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/SQLExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/SQLExecution.scala
@@ -30,6 +30,7 @@ import org.apache.spark.internal.config.{SPARK_DRIVER_PREFIX, SPARK_EXECUTOR_PRE
import org.apache.spark.internal.config.Tests.IS_TESTING
import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanExec
+import org.apache.spark.sql.execution.exchange.ShuffleExchangeLike
import org.apache.spark.sql.execution.ui.{SparkListenerSQLExecutionEnd, SparkListenerSQLExecutionStart}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.StaticSQLConf.SQL_EVENT_TRUNCATE_LENGTH
@@ -178,8 +179,11 @@ object SQLExecution extends Logging {
val shuffleIds = queryExecution.executedPlan match {
case ae: AdaptiveSparkPlanExec =>
ae.context.shuffleIds.asScala.keys
- case _ =>
- Iterable.empty
+ case nonAdaptivePlan =>
+ nonAdaptivePlan.collect {
+ case exec: ShuffleExchangeLike =>
+ exec.shuffleId
+ }
}
shuffleIds.foreach { shuffleId =>
queryExecution.shuffleCleanupMode match {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/SortExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/SortExec.scala
index 5abc6f3ed5769..11fde41aae9e4 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/SortExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/SortExec.scala
@@ -62,7 +62,9 @@ case class SortExec(
"peakMemory" -> SQLMetrics.createSizeMetric(sparkContext, "peak memory"),
"spillSize" -> SQLMetrics.createSizeMetric(sparkContext, "spill size"))
- private[sql] var rowSorter: UnsafeExternalRowSorter = _
+ // Each task has its own instance of UnsafeExternalRowSorter. It is created in the
+ // createSorter method and stored in a ThreadLocal variable.
+ private[sql] var rowSorter: ThreadLocal[UnsafeExternalRowSorter] = _
/**
* This method gets invoked only once for each SortExec instance to initialize an
@@ -71,6 +73,8 @@ case class SortExec(
* should make it public.
*/
def createSorter(): UnsafeExternalRowSorter = {
+ rowSorter = new ThreadLocal[UnsafeExternalRowSorter]()
+
val ordering = RowOrdering.create(sortOrder, output)
// The comparator for comparing prefix
@@ -95,13 +99,14 @@ case class SortExec(
}
val pageSize = SparkEnv.get.memoryManager.pageSizeBytes
- rowSorter = UnsafeExternalRowSorter.create(
+ val newRowSorter = UnsafeExternalRowSorter.create(
schema, ordering, prefixComparator, prefixComputer, pageSize, canUseRadixSort)
if (testSpillFrequency > 0) {
- rowSorter.setTestSpillFrequency(testSpillFrequency)
+ newRowSorter.setTestSpillFrequency(testSpillFrequency)
}
- rowSorter
+ rowSorter.set(newRowSorter)
+ rowSorter.get()
}
protected override def doExecute(): RDD[InternalRow] = {
@@ -194,11 +199,11 @@ case class SortExec(
* In SortExec, we override cleanupResources to close the UnsafeExternalRowSorter.
*/
override protected[sql] def cleanupResources(): Unit = {
- if (rowSorter != null) {
+ if (rowSorter != null && rowSorter.get() != null) {
// It's possible for rowSorter to be null here. For example, with an empty iterator in the
// current task, the downstream physical node (like SortMergeJoinExec) will trigger
// cleanupResources before rowSorter is initialized in createSorter.
- rowSorter.cleanupResources()
+ rowSorter.get().cleanupResources()
}
super.cleanupResources()
}
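
A minimal sketch (hypothetical Sorter class, not Spark's UnsafeExternalRowSorter) of the pattern this change applies: the shared SortExec instance keeps a ThreadLocal so that each task thread gets its own sorter, and cleanup only touches the sorter belonging to the current thread.

    final class Sorter {
      def cleanup(): Unit = println(s"cleaned up sorter on ${Thread.currentThread().getName}")
    }

    object PerThreadSorter {
      private val holder = new ThreadLocal[Sorter]()

      // Called once per task: creates this thread's sorter and remembers it.
      def createSorter(): Sorter = {
        val sorter = new Sorter
        holder.set(sorter)
        sorter
      }

      // Called at task end: only cleans up if this thread ever created a sorter.
      def cleanupResources(): Unit = {
        val sorter = holder.get()
        if (sorter != null) sorter.cleanup()
      }
    }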
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkPlan.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkPlan.scala
index d9bb057282dff..e7844a88bf141 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkPlan.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkPlan.scala
@@ -172,7 +172,7 @@ abstract class SparkPlan extends QueryPlan[SparkPlan] with Logging with Serializ
* guarantees that the outputs of these children will have same number of partitions, so that the
* operator can safely zip partitions of these children's result RDDs. Some operators can leverage
* this guarantee to satisfy some interesting requirement, e.g., non-broadcast joins can specify
- * HashClusteredDistribution(a,b) for its left child, and specify HashClusteredDistribution(c,d)
+ * ClusteredDistribution(a,b) for its left child, and specify ClusteredDistribution(c,d)
* for its right child, then it's guaranteed that left and right child are co-partitioned by
* a,b/c,d, which means tuples of same value are in the partitions of same index, e.g.,
* (a=1,b=2) and (c=1,d=2) are both in the second partition of left and right child.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkStrategies.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkStrategies.scala
index d19ec2defc022..f76bc911bef8f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkStrategies.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/SparkStrategies.scala
@@ -40,7 +40,11 @@ import org.apache.spark.sql.execution.datasources.{WriteFiles, WriteFilesExec}
import org.apache.spark.sql.execution.exchange.{REBALANCE_PARTITIONS_BY_COL, REBALANCE_PARTITIONS_BY_NONE, REPARTITION_BY_COL, REPARTITION_BY_NUM, ShuffleExchangeExec}
import org.apache.spark.sql.execution.python._
import org.apache.spark.sql.execution.python.streaming.{FlatMapGroupsInPandasWithStateExec, TransformWithStateInPySparkExec}
-import org.apache.spark.sql.execution.streaming._
+import org.apache.spark.sql.execution.streaming.operators.stateful.{EventTimeWatermarkExec, StreamingDeduplicateExec, StreamingDeduplicateWithinWatermarkExec, StreamingGlobalLimitExec, StreamingLocalLimitExec, UpdateEventTimeColumnExec}
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.FlatMapGroupsWithStateExec
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinExec
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateExec
+import org.apache.spark.sql.execution.streaming.runtime.{StreamingExecutionRelation, StreamingRelation, StreamingRelationExec}
import org.apache.spark.sql.execution.streaming.sources.MemoryPlan
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming.OutputMode
@@ -644,7 +648,7 @@ abstract class SparkStrategies extends QueryPlanner[SparkPlan] {
case PhysicalAggregation(groupingExpressions, aggExpressions, resultExpressions, child)
if aggExpressions.forall(_.aggregateFunction.isInstanceOf[PythonUDAF]) =>
- Seq(execution.python.AggregateInPandasExec(
+ Seq(execution.python.ArrowAggregatePythonExec(
groupingExpressions,
aggExpressions,
resultExpressions,
@@ -671,7 +675,7 @@ abstract class SparkStrategies extends QueryPlanner[SparkPlan] {
case PhysicalWindow(
WindowFunctionType.Python, windowExprs, partitionSpec, orderSpec, child) =>
- execution.python.WindowInPandasExec(
+ execution.python.ArrowWindowPythonExec(
windowExprs, partitionSpec, orderSpec, planLater(child)) :: Nil
case _ => Nil
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/UnionLoopExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/UnionLoopExec.scala
index e14f6f378b02a..47b5ba365cc20 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/UnionLoopExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/UnionLoopExec.scala
@@ -135,7 +135,8 @@ case class UnionLoopExec(
// reference any external tables, we are able to calculate everything in the optimizer,
// using the ConvertToLocalRelation rule, which significantly improves runtime.
if (count <= localRelationLimit) {
- val local = LocalRelation.fromExternalRows(anchor.output, df.collect().toIndexedSeq)
+ val local = LocalRelation.fromExternalRows(df.logicalPlan.output,
+ df.collect().toIndexedSeq)
(Dataset.ofRows(session, local), count)
} else {
(materializedDF, count)
@@ -182,7 +183,10 @@ case class UnionLoopExec(
// Main loop for obtaining the result of the recursive query.
while (prevCount > 0 && !limitReached) {
- var prevPlan: LogicalPlan = null
+ // The optimizer might have removed the UnionLoopRef in the recursion node (for example as a
+ // result of an empty join). In this case, prevPlan cannot be set by the cases
+ // below, so we default it to the previous iteration's result here.
+ var prevPlan: LogicalPlan = prevDF.logicalPlan
// If the recursive part contains non-deterministic expressions that depends on a seed, we
// need to create a new seed since the seed for this expression is set in the analysis, and
@@ -210,7 +214,7 @@ case class UnionLoopExec(
// SQLConf.CTE_RECURSION_ANCHOR_ROWS_LIMIT_TO_CONVERT_TO_LOCAL_RELATION is set to be
// anything larger than 0. However, we still handle this case in a special way to
// optimize the case when the flag is set to 0.
- case p @ Project(projectList, _: OneRowRelation) =>
+ case p @ Project(projectList, _: OneRowRelation) if p.subqueries.isEmpty =>
prevPlan = p
val prevPlanToRefMapping = projectList.zip(r.output).map {
case (fa: Alias, ta) => fa.withExprId(ta.exprId).withName(ta.name)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/UnsafeRowSerializer.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/UnsafeRowSerializer.scala
index 42fcfa8d60fa7..9728d664998e1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/UnsafeRowSerializer.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/UnsafeRowSerializer.scala
@@ -22,13 +22,12 @@ import java.nio.ByteBuffer
import scala.reflect.ClassTag
-import com.google.common.io.ByteStreams
-
import org.apache.spark.SparkUnsupportedOperationException
import org.apache.spark.serializer.{DeserializationStream, SerializationStream, Serializer, SerializerInstance}
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.unsafe.Platform
+import org.apache.spark.util.Utils
/**
* Serializer for serializing [[UnsafeRow]]s during shuffle. Since UnsafeRows are already stored as
@@ -125,7 +124,7 @@ private class UnsafeRowSerializerInstance(
if (rowBuffer.length < rowSize) {
rowBuffer = new Array[Byte](rowSize)
}
- ByteStreams.readFully(dIn, rowBuffer, 0, rowSize)
+ Utils.readFully(dIn, rowBuffer, 0, rowSize)
row.pointTo(rowBuffer, Platform.BYTE_ARRAY_OFFSET, rowSize)
rowSize = readSize()
if (rowSize == EOF) { // We are returning the last row in this stream
@@ -160,7 +159,7 @@ private class UnsafeRowSerializerInstance(
if (rowBuffer.length < rowSize) {
rowBuffer = new Array[Byte](rowSize)
}
- ByteStreams.readFully(dIn, rowBuffer, 0, rowSize)
+ Utils.readFully(dIn, rowBuffer, 0, rowSize)
row.pointTo(rowBuffer, Platform.BYTE_ARRAY_OFFSET, rowSize)
row.asInstanceOf[T]
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/WholeStageCodegenExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/WholeStageCodegenExec.scala
index 21b5177fe2208..246508965d3d6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/WholeStageCodegenExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/WholeStageCodegenExec.scala
@@ -25,7 +25,6 @@ import scala.util.control.NonFatal
import org.apache.spark.{broadcast, SparkException, SparkUnsupportedOperationException}
import org.apache.spark.internal.LogKeys.{CODEGEN_STAGE_ID, CONFIG, ERROR, HUGE_METHOD_LIMIT, MAX_METHOD_CODE_SIZE, TREE_NODE}
-import org.apache.spark.internal.MDC
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
@@ -548,6 +547,7 @@ case class InputAdapter(child: SparkPlan) extends UnaryExecNode with InputRDDCod
addSuffix: Boolean = false,
maxFields: Int,
printNodeId: Boolean,
+ printOutputColumns: Boolean,
indent: Int = 0): Unit = {
child.generateTreeString(
depth,
@@ -558,6 +558,7 @@ case class InputAdapter(child: SparkPlan) extends UnaryExecNode with InputRDDCod
addSuffix = false,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
}
@@ -819,6 +820,7 @@ case class WholeStageCodegenExec(child: SparkPlan)(val codegenStageId: Int)
addSuffix: Boolean = false,
maxFields: Int,
printNodeId: Boolean,
+ printOutputColumns: Boolean,
indent: Int = 0): Unit = {
child.generateTreeString(
depth,
@@ -829,6 +831,7 @@ case class WholeStageCodegenExec(child: SparkPlan)(val codegenStageId: Int)
false,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEOptimizer.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEOptimizer.scala
index 0f1743eeaacfb..f16c6d9cfe6dd 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEOptimizer.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEOptimizer.scala
@@ -18,7 +18,6 @@
package org.apache.spark.sql.execution.adaptive
import org.apache.spark.internal.LogKeys.{BATCH_NAME, RULE_NAME}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.analysis.UpdateAttributeNullability
import org.apache.spark.sql.catalyst.optimizer.{ConvertToLocalRelation, EliminateLimits, OptimizeOneRowPlan}
import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, LogicalPlanIntegrity}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEShuffleReadExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEShuffleReadExec.scala
index e8b70f94a7692..2a600b31cc297 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEShuffleReadExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AQEShuffleReadExec.scala
@@ -178,6 +178,15 @@ case class AQEShuffleReadExec private(
numPartitionsMetric.set(partitionSpecs.length)
driverAccumUpdates += (numPartitionsMetric.id -> partitionSpecs.length.toLong)
+ val numEmptyPartitionsMetric = metrics("numEmptyPartitions")
+ val numEmptyPartitions = child match {
+ case s: ShuffleQueryStageExec =>
+ s.mapStats.map(stats => stats.bytesByPartitionId.count(_ == 0)).getOrElse(0)
+ case _ => 0
+ }
+ numEmptyPartitionsMetric.set(numEmptyPartitions)
+ driverAccumUpdates += (numEmptyPartitionsMetric.id -> numEmptyPartitions.toLong)
+
if (hasSkewedPartition) {
val skewedSpecs = partitionSpecs.collect {
case p: PartialReducerPartitionSpec => p
@@ -200,15 +209,7 @@ case class AQEShuffleReadExec private(
val numCoalescedPartitionsMetric = metrics("numCoalescedPartitions")
val x = partitionSpecs.count(isCoalescedSpec)
numCoalescedPartitionsMetric.set(x)
- val numEmptyPartitionsMetric = metrics("numEmptyPartitions")
- val y = child match {
- case s: ShuffleQueryStageExec =>
- s.mapStats.map(stats => stats.bytesByPartitionId.count(_ == 0)).getOrElse(0)
- case _ => 0
- }
- numEmptyPartitionsMetric.set(y)
- driverAccumUpdates ++= Seq(numCoalescedPartitionsMetric.id -> x,
- numEmptyPartitionsMetric.id -> y)
+ driverAccumUpdates ++= Seq(numCoalescedPartitionsMetric.id -> x)
}
partitionDataSizes.foreach { dataSizes =>
@@ -223,7 +224,9 @@ case class AQEShuffleReadExec private(
@transient override lazy val metrics: Map[String, SQLMetric] = {
if (shuffleStage.isDefined) {
- Map("numPartitions" -> SQLMetrics.createMetric(sparkContext, "number of partitions")) ++ {
+ Map("numPartitions" -> SQLMetrics.createMetric(sparkContext, "number of partitions"),
+ "numEmptyPartitions" ->
+ SQLMetrics.createMetric(sparkContext, "number of empty partitions")) ++ {
if (isLocalRead) {
// We split the mapper partition evenly when creating local shuffle read, so no
// data size info is available.
@@ -244,9 +247,7 @@ case class AQEShuffleReadExec private(
} ++ {
if (hasCoalescedPartition) {
Map("numCoalescedPartitions" ->
- SQLMetrics.createMetric(sparkContext, "number of coalesced partitions"),
- "numEmptyPartitions" ->
- SQLMetrics.createMetric(sparkContext, "number of empty partitions"))
+ SQLMetrics.createMetric(sparkContext, "number of coalesced partitions"))
} else {
Map.empty
}
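
A tiny sketch (plain Scala, hypothetical sizes) of how the relocated numEmptyPartitions metric is derived from the shuffle's map output statistics: a partition is counted as empty when its total output size in bytes is zero.

    val bytesByPartitionId: Array[Long] = Array(0L, 1024L, 0L, 4096L)
    val numEmptyPartitions = bytesByPartitionId.count(_ == 0)
    // numEmptyPartitions == 2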
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AdaptiveSparkPlanExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AdaptiveSparkPlanExec.scala
index 996e01a0ea936..0e50c03b6cc9f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AdaptiveSparkPlanExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/AdaptiveSparkPlanExec.scala
@@ -28,8 +28,8 @@ import scala.util.control.NonFatal
import org.apache.spark.SparkException
import org.apache.spark.broadcast
-import org.apache.spark.internal.{MDC, MessageWithContext}
import org.apache.spark.internal.LogKeys._
+import org.apache.spark.internal.MessageWithContext
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.Attribute
@@ -430,6 +430,7 @@ case class AdaptiveSparkPlanExec(
addSuffix: Boolean = false,
maxFields: Int,
printNodeId: Boolean,
+ printOutputColumns: Boolean,
indent: Int = 0): Unit = {
super.generateTreeString(
depth,
@@ -440,6 +441,7 @@ case class AdaptiveSparkPlanExec(
addSuffix,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
if (currentPhysicalPlan.fastEquals(initialPlan)) {
lastChildren.add(true)
@@ -452,6 +454,7 @@ case class AdaptiveSparkPlanExec(
addSuffix = false,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
lastChildren.remove(lastChildren.size() - 1)
} else {
@@ -462,7 +465,8 @@ case class AdaptiveSparkPlanExec(
append,
verbose,
maxFields,
- printNodeId)
+ printNodeId,
+ printOutputColumns)
generateTreeStringWithHeader(
"Initial Plan",
initialPlan,
@@ -470,11 +474,11 @@ case class AdaptiveSparkPlanExec(
append,
verbose,
maxFields,
- printNodeId)
+ printNodeId,
+ printOutputColumns)
}
}
-
private def generateTreeStringWithHeader(
header: String,
plan: SparkPlan,
@@ -482,8 +486,9 @@ case class AdaptiveSparkPlanExec(
append: String => Unit,
verbose: Boolean,
maxFields: Int,
- printNodeId: Boolean): Unit = {
- append(" " * depth)
+ printNodeId: Boolean,
+ printOutputColumns: Boolean): Unit = {
+ append(" ".repeat(depth))
append(s"+- == $header ==\n")
plan.generateTreeString(
0,
@@ -494,6 +499,7 @@ case class AdaptiveSparkPlanExec(
addSuffix = false,
maxFields,
printNodeId,
+ printOutputColumns,
indent = depth + 1)
}
@@ -891,7 +897,7 @@ case class AdaptiveSparkPlanExec(
val e = if (originalErrors.size == 1) {
originalErrors.head
} else {
- val se = QueryExecutionErrors.multiFailuresInStageMaterializationError(originalErrors.head)
+ val se = QueryExecutionErrors.multiFailuresInStageMaterializationError(originalErrors)
originalErrors.tail.foreach(se.addSuppressed)
se
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/InsertAdaptiveSparkPlan.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/InsertAdaptiveSparkPlan.scala
index 2855f902a8509..aa748d8de6dc0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/InsertAdaptiveSparkPlan.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/InsertAdaptiveSparkPlan.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.execution.adaptive
import scala.collection.mutable
import org.apache.spark.internal.LogKeys.{CONFIG, SUB_QUERY}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.expressions
import org.apache.spark.sql.catalyst.expressions.{DynamicPruningSubquery, ListQuery, SubqueryExpression}
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/LogicalQueryStage.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/LogicalQueryStage.scala
index 506f52fd9072e..62e00d1ea6eda 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/LogicalQueryStage.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/LogicalQueryStage.scala
@@ -82,4 +82,32 @@ case class LogicalQueryStage(
case _: QueryStageExec => true
case _ => false
}
+
+ override def generateTreeString(
+ depth: Int,
+ lastChildren: java.util.ArrayList[Boolean],
+ append: String => Unit,
+ verbose: Boolean,
+ prefix: String = "",
+ addSuffix: Boolean = false,
+ maxFields: Int,
+ printNodeId: Boolean,
+ printOutputColumns: Boolean,
+ indent: Int = 0): Unit = {
+ super.generateTreeString(depth,
+ lastChildren,
+ append,
+ verbose,
+ prefix,
+ addSuffix,
+ maxFields,
+ printNodeId,
+ printOutputColumns,
+ indent)
+ lastChildren.add(true)
+ logicalPlan.generateTreeString(
+ depth + 1, lastChildren, append, verbose, "", false, maxFields, printNodeId,
+ printOutputColumns, indent)
+ lastChildren.remove(lastChildren.size() - 1)
+ }
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/QueryStageExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/QueryStageExec.scala
index 0a5bdefea7bc5..be58bccd1489a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/QueryStageExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/QueryStageExec.scala
@@ -134,6 +134,7 @@ abstract class QueryStageExec extends LeafExecNode {
addSuffix: Boolean = false,
maxFields: Int,
printNodeId: Boolean,
+ printOutputColumns: Boolean,
indent: Int = 0): Unit = {
super.generateTreeString(depth,
lastChildren,
@@ -143,10 +144,12 @@ abstract class QueryStageExec extends LeafExecNode {
addSuffix,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
lastChildren.add(true)
plan.generateTreeString(
- depth + 1, lastChildren, append, verbose, "", false, maxFields, printNodeId, indent)
+ depth + 1, lastChildren, append, verbose, "", false, maxFields, printNodeId,
+ printOutputColumns, indent)
lastChildren.remove(lastChildren.size() - 1)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/ShufflePartitionsUtil.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/ShufflePartitionsUtil.scala
index 1ea4df0254673..b7cf0ce3150ba 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/ShufflePartitionsUtil.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/adaptive/ShufflePartitionsUtil.scala
@@ -20,7 +20,7 @@ package org.apache.spark.sql.execution.adaptive
import scala.collection.mutable.ArrayBuffer
import org.apache.spark.{MapOutputStatistics, MapOutputTrackerMaster, SparkEnv}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.execution.{CoalescedPartitionSpec, PartialReducerPartitionSpec, ShufflePartitionSpec}
object ShufflePartitionsUtil extends Logging {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
index de1b83c16ac97..58055fa6129a5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggUtils.scala
@@ -22,7 +22,7 @@ import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate._
import org.apache.spark.sql.catalyst.plans.logical.Aggregate
import org.apache.spark.sql.execution.SparkPlan
-import org.apache.spark.sql.execution.streaming._
+import org.apache.spark.sql.execution.streaming.operators.stateful._
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.Utils
import org.apache.spark.util.collection.{Utils => CUtils}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggregateCodegenSupport.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggregateCodegenSupport.scala
index 40112979c6d46..595cecabe9185 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggregateCodegenSupport.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/AggregateCodegenSupport.scala
@@ -19,7 +19,6 @@ package org.apache.spark.sql.execution.aggregate
import org.apache.spark.SparkException
import org.apache.spark.internal.LogKeys.MAX_JVM_METHOD_PARAMS_LENGTH
-import org.apache.spark.internal.MDC
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeSet, Expression, ExpressionEquals, UnsafeRow}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/BaseAggregateExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/BaseAggregateExec.scala
index 5391d5807597c..7ae00467a0114 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/BaseAggregateExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/BaseAggregateExec.scala
@@ -22,7 +22,7 @@ import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeReference,
import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, Final, PartialMerge}
import org.apache.spark.sql.catalyst.plans.physical.{AllTuples, ClusteredDistribution, Distribution, UnspecifiedDistribution}
import org.apache.spark.sql.execution.{ExplainUtils, PartitioningPreservingUnaryExecNode, UnaryExecNode}
-import org.apache.spark.sql.execution.streaming.StatefulOperatorPartitioning
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorPartitioning
/**
* Holds common logic for aggregate operators
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashAggregateExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashAggregateExec.scala
index 24528b6f4da15..4a0db1c613d60 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashAggregateExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashAggregateExec.scala
@@ -23,7 +23,6 @@ import scala.collection.mutable
import org.apache.spark.TaskContext
import org.apache.spark.internal.LogKeys.CONFIG
-import org.apache.spark.internal.MDC
import org.apache.spark.memory.SparkOutOfMemoryError
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashMapGenerator.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashMapGenerator.scala
index 19a36483abe6d..af9dcb44cf1f6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashMapGenerator.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/HashMapGenerator.scala
@@ -160,7 +160,8 @@ abstract class HashMapGenerator(
case BooleanType => hashInt(s"$input ? 1 : 0")
case ByteType | ShortType | IntegerType | DateType | _: YearMonthIntervalType =>
hashInt(input)
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType => hashLong(input)
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
+ hashLong(input)
case FloatType => hashInt(s"Float.floatToIntBits($input)")
case DoubleType => hashLong(s"Double.doubleToLongBits($input)")
case d: DecimalType =>
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationIterator.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationIterator.scala
index a4a6dc8e4ab01..fbd3ce040e487 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationIterator.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationIterator.scala
@@ -18,7 +18,7 @@
package org.apache.spark.sql.execution.aggregate
import org.apache.spark.{SparkEnv, SparkException, TaskContext}
-import org.apache.spark.internal.{config, Logging, MDC}
+import org.apache.spark.internal.{config, Logging}
import org.apache.spark.internal.LogKeys.{CONFIG, HASH_MAP_SIZE, OBJECT_AGG_SORT_BASED_FALLBACK_THRESHOLD}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
@@ -332,6 +332,7 @@ class SortBasedAggregator(
SparkEnv.get.serializerManager,
TaskContext.get().taskMemoryManager().pageSizeBytes,
SparkEnv.get.conf.get(config.SHUFFLE_SPILL_NUM_ELEMENTS_FORCE_SPILL_THRESHOLD),
+ SparkEnv.get.conf.get(config.SHUFFLE_SPILL_MAX_SIZE_FORCE_SPILL_THRESHOLD),
null
)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationMap.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationMap.scala
index 9b68e6f02a859..5384f939c31ab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationMap.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/ObjectAggregationMap.scala
@@ -79,6 +79,7 @@ class ObjectAggregationMap() {
SparkEnv.get.serializerManager,
TaskContext.get().taskMemoryManager().pageSizeBytes,
SparkEnv.get.conf.get(config.SHUFFLE_SPILL_NUM_ELEMENTS_FORCE_SPILL_THRESHOLD),
+ SparkEnv.get.conf.get(config.SHUFFLE_SPILL_MAX_SIZE_FORCE_SPILL_THRESHOLD),
null
)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsExec.scala
index b5dfd4639d8f2..b0b6d45620ac9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsExec.scala
@@ -23,7 +23,7 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{Ascending, Attribute, SortOrder}
import org.apache.spark.sql.catalyst.plans.physical.{AllTuples, ClusteredDistribution, Distribution, Partitioning}
import org.apache.spark.sql.execution.{SparkPlan, UnaryExecNode}
-import org.apache.spark.sql.execution.streaming.StatefulOperatorPartitioning
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorPartitioning
/**
* This node updates the session window spec of each input rows via analyzing neighbor rows and
@@ -52,10 +52,11 @@ case class UpdatingSessionsExec(
override protected def doExecute(): RDD[InternalRow] = {
val inMemoryThreshold = conf.sessionWindowBufferInMemoryThreshold
val spillThreshold = conf.sessionWindowBufferSpillThreshold
+ val spillSizeThreshold = conf.sessionWindowBufferSpillSizeThreshold
child.execute().mapPartitions { iter =>
new UpdatingSessionsIterator(iter, groupingExpression, sessionExpression,
- child.output, inMemoryThreshold, spillThreshold)
+ child.output, inMemoryThreshold, spillThreshold, spillSizeThreshold)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsIterator.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsIterator.scala
index 39b835f1f45fb..64bb3717f52bc 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsIterator.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/UpdatingSessionsIterator.scala
@@ -43,7 +43,8 @@ class UpdatingSessionsIterator(
sessionExpression: NamedExpression,
inputSchema: Seq[Attribute],
inMemoryThreshold: Int,
- spillThreshold: Int) extends Iterator[InternalRow] {
+ spillThreshold: Int,
+ spillSizeThreshold: Long) extends Iterator[InternalRow] {
private val groupingWithoutSession: Seq[NamedExpression] =
groupingExpressions.diff(Seq(sessionExpression))
@@ -150,7 +151,8 @@ class UpdatingSessionsIterator(
currentKeys = groupingKey.copy()
currentSession = sessionStruct.copy()
- rowsForCurrentSession = new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold)
+ rowsForCurrentSession = new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold,
+ spillSizeThreshold)
rowsForCurrentSession.add(currentRow.asInstanceOf[UnsafeRow])
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/udaf.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/udaf.scala
index 1197a16a35e9b..492f11607ce6d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/udaf.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/aggregate/udaf.scala
@@ -84,7 +84,7 @@ sealed trait BufferSetterGetterUtils {
(row: InternalRow, ordinal: Int) =>
if (row.isNullAt(ordinal)) null else row.getInt(ordinal)
- case TimestampType | TimestampNTZType =>
+ case TimestampType | TimestampNTZType | _: TimeType =>
(row: InternalRow, ordinal: Int) =>
if (row.isNullAt(ordinal)) null else row.getLong(ordinal)
@@ -188,7 +188,7 @@ sealed trait BufferSetterGetterUtils {
row.setNullAt(ordinal)
}
- case TimestampType | TimestampNTZType =>
+ case TimestampType | TimestampNTZType | _: TimeType =>
(row: InternalRow, ordinal: Int, value: Any) =>
if (value != null) {
row.setLong(ordinal, value.asInstanceOf[Long])
@@ -530,7 +530,7 @@ case class ScalaAggregator[IN, BUF, OUT](
def eval(buffer: BUF): Any = {
val row = outputSerializer(agg.finish(buffer))
- if (outputEncoder.isSerializedAsStruct) row else row.get(0, dataType)
+ if (outputEncoder.isSerializedAsStructForTopLevel) row else row.get(0, dataType)
}
@transient private[this] lazy val bufferRow = new UnsafeRow(bufferEncoder.namedExpressions.length)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/arrow/ArrowConverters.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/arrow/ArrowConverters.scala
index ed490347ae821..3072a12e3d587 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/arrow/ArrowConverters.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/arrow/ArrowConverters.scala
@@ -264,6 +264,109 @@ private[sql] object ArrowConverters extends Logging {
}
}
+ /**
+ * A class that converts input data in the form of a byte array into InternalRow instances,
+ * implementing the Iterator interface.
+ *
+ * The input data must be a valid Arrow IPC stream; that is, the first message is always the
+ * schema, followed by N record batches.
+ *
+ * @param input The serialized Arrow IPC stream as a byte array
+ * @param context The Spark task context, used to register resource cleanup at task completion
+ */
+ private[sql] class InternalRowIteratorFromIPCStream(
+ input: Array[Byte],
+ context: TaskContext) extends Iterator[InternalRow] {
+
+ // Keep all the resources we have opened, in order; they should be
+ // closed in reverse order at the end.
+ private val resources = new ArrayBuffer[AutoCloseable]()
+
+ // Create an allocator used for all Arrow related memory.
+ protected val allocator: BufferAllocator = ArrowUtils.rootAllocator.newChildAllocator(
+ s"to${this.getClass.getSimpleName}",
+ 0,
+ Long.MaxValue)
+ resources.append(allocator)
+
+ private val reader = try {
+ new ArrowStreamReader(new ByteArrayInputStream(input), allocator)
+ } catch {
+ case e: Exception =>
+ closeAll(resources.toSeq.reverse: _*)
+ throw new IllegalArgumentException(
+ s"Failed to create ArrowStreamReader: ${e.getMessage}", e)
+ }
+ resources.append(reader)
+
+ private val root: VectorSchemaRoot = try {
+ reader.getVectorSchemaRoot
+ } catch {
+ case e: Exception =>
+ closeAll(resources.toSeq.reverse: _*)
+ throw new IllegalArgumentException(
+ s"Failed to read schema from IPC stream: ${e.getMessage}", e)
+ }
+ resources.append(root)
+
+ val schema: StructType = try {
+ ArrowUtils.fromArrowSchema(root.getSchema)
+ } catch {
+ case e: Exception =>
+ closeAll(resources.toSeq.reverse: _*)
+ throw new IllegalArgumentException(s"Failed to convert Arrow schema: ${e.getMessage}", e)
+ }
+
+ // TODO: wrap in exception
+ private var rowIterator: Iterator[InternalRow] = vectorSchemaRootToIter(root)
+
+ // Metrics to track batch processing
+ private var _batchesLoaded: Int = 0
+ private var _totalRowsProcessed: Long = 0L
+
+ if (context != null) {
+ context.addTaskCompletionListener[Unit] { _ =>
+ closeAll(resources.toSeq.reverse: _*)
+ }
+ }
+
+ // Public accessors for metrics
+ def batchesLoaded: Int = _batchesLoaded
+ def totalRowsProcessed: Long = _totalRowsProcessed
+
+ // Loads the next batch from the Arrow reader and returns true if a
+ // batch could be loaded, false otherwise.
+ private def loadNextBatch(): Boolean = {
+ if (reader.loadNextBatch()) {
+ rowIterator = vectorSchemaRootToIter(root)
+ _batchesLoaded += 1
+ true
+ } else {
+ false
+ }
+ }
+
+ override def hasNext: Boolean = {
+ if (rowIterator.hasNext) {
+ true
+ } else {
+ if (!loadNextBatch()) {
+ false
+ } else {
+ hasNext
+ }
+ }
+ }
+
+ override def next(): InternalRow = {
+ if (!hasNext) {
+ throw new NoSuchElementException("No more elements in iterator")
+ }
+ _totalRowsProcessed += 1
+ rowIterator.next()
+ }
+ }
+
/**
* An InternalRow iterator which parse data from serialized ArrowRecordBatches, subclass should
* implement [[nextBatch]] to parse data from binary records.
@@ -382,6 +485,23 @@ private[sql] object ArrowConverters extends Logging {
(iterator, iterator.schema)
}
+ /**
+ * Creates an iterator from a Byte array to deserialize an Arrow IPC stream with exactly
+ * one schema and a varying number of record batches. Returns an iterator over the
+ * created InternalRow.
+ */
+ private[sql] def fromIPCStream(input: Array[Byte], context: TaskContext):
+ (Iterator[InternalRow], StructType) = {
+ fromIPCStreamWithIterator(input, context)
+ }
+
+ // Overloaded method for tests to access the iterator with metrics
+ private[sql] def fromIPCStreamWithIterator(input: Array[Byte], context: TaskContext):
+ (InternalRowIteratorFromIPCStream, StructType) = {
+ val iterator = new InternalRowIteratorFromIPCStream(input, context)
+ (iterator, iterator.schema)
+ }
+
/**
* Convert an arrow batch container into an iterator of InternalRow.
*/
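
A minimal sketch (assuming the arrow-vector and arrow-memory artifacts are on the classpath, and a bytes value holding a serialized IPC stream) of the read loop that InternalRowIteratorFromIPCStream wraps: an ArrowStreamReader first exposes the schema via its VectorSchemaRoot, then loads record batches one at a time until the stream is exhausted.

    import java.io.ByteArrayInputStream
    import org.apache.arrow.memory.RootAllocator
    import org.apache.arrow.vector.ipc.ArrowStreamReader

    def readIpcStream(bytes: Array[Byte]): Unit = {
      val allocator = new RootAllocator(Long.MaxValue)
      val reader = new ArrowStreamReader(new ByteArrayInputStream(bytes), allocator)
      try {
        val root = reader.getVectorSchemaRoot          // schema is read eagerly here
        println(s"schema: ${root.getSchema}")
        while (reader.loadNextBatch()) {               // one record batch per iteration
          println(s"loaded batch with ${root.getRowCount} rows")
        }
      } finally {
        // Close in reverse order of creation, mirroring the resource handling above.
        reader.close()
        allocator.close()
      }
    }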
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/basicPhysicalOperators.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/basicPhysicalOperators.scala
index 995f857bbf635..78d7eb4ec1f51 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/basicPhysicalOperators.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/basicPhysicalOperators.scala
@@ -25,7 +25,7 @@ import scala.concurrent.ExecutionContext
import scala.concurrent.duration.Duration
import org.apache.spark.{InterruptibleIterator, Partition, SparkContext, SparkException, TaskContext}
-import org.apache.spark.rdd.{EmptyRDD, PartitionwiseSampledRDD, RDD}
+import org.apache.spark.rdd.{EmptyRDD, PartitionwiseSampledRDD, RDD, SQLPartitioningAwareUnionRDD}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.BindReferences.bindReferences
@@ -699,8 +699,80 @@ case class UnionExec(children: Seq[SparkPlan]) extends SparkPlan {
}
}
- protected override def doExecute(): RDD[InternalRow] =
- sparkContext.union(children.map(_.execute()))
+ /**
+ * Returns the output partitionings of the children, with the attributes converted to
+ * the first child's attributes at the same position.
+ */
+ private def prepareOutputPartitioning(): Seq[Partitioning] = {
+ // Create a map of attributes from the other children to the first child.
+ val firstAttrs = children.head.output
+ val attributesMap = children.tail.map(_.output).map { otherAttrs =>
+ otherAttrs.zip(firstAttrs).map { case (attr, firstAttr) =>
+ attr -> firstAttr
+ }.toMap
+ }
+
+ val partitionings = children.map(_.outputPartitioning)
+ val firstPartitioning = partitionings.head
+ val otherPartitionings = partitionings.tail
+
+ val convertedOtherPartitionings = otherPartitionings.zipWithIndex.map { case (p, idx) =>
+ val attributeMap = attributesMap(idx)
+ p match {
+ case e: Expression =>
+ e.transform {
+ case a: Attribute if attributeMap.contains(a) => attributeMap(a)
+ }.asInstanceOf[Partitioning]
+ case _ => p
+ }
+ }
+ Seq(firstPartitioning) ++ convertedOtherPartitionings
+ }
+
+ private def comparePartitioning(left: Partitioning, right: Partitioning): Boolean = {
+ (left, right) match {
+ case (SinglePartition, SinglePartition) => true
+ case (l: HashPartitioningLike, r: HashPartitioningLike) => l == r
+ // Note: two `RangePartitioning`s, even with the same ordering and number of partitions,
+ // are not equal, because they might have different partition bounds.
+ case _ => false
+ }
+ }
+
+ override def outputPartitioning: Partitioning = {
+ if (conf.getConf(SQLConf.UNION_OUTPUT_PARTITIONING)) {
+ val partitionings = prepareOutputPartitioning()
+ if (partitionings.forall(comparePartitioning(_, partitionings.head))) {
+ val partitioner = partitionings.head
+
+ // Take the output attributes of this union and map the partitioner to them.
+ val attributeMap = children.head.output.zip(output).toMap
+ partitioner match {
+ case e: Expression =>
+ e.transform {
+ case a: Attribute if attributeMap.contains(a) => attributeMap(a)
+ }.asInstanceOf[Partitioning]
+ case _ => partitioner
+ }
+ } else {
+ super.outputPartitioning
+ }
+ } else {
+ super.outputPartitioning
+ }
+ }
+
+ protected override def doExecute(): RDD[InternalRow] = {
+ if (outputPartitioning.isInstanceOf[UnknownPartitioning]) {
+ sparkContext.union(children.map(_.execute()))
+ } else {
+ // This union has a known partitioning, i.e., its children have semantically the same
+ // partitioning, so this union can preserve the partitioning by using a custom
+ // partitioning-aware union RDD.
+ val nonEmptyRdds = children.map(_.execute()).filter(!_.partitions.isEmpty)
+ new SQLPartitioningAwareUnionRDD(sparkContext, nonEmptyRdds, outputPartitioning.numPartitions)
+ }
+ }
override def supportsColumnar: Boolean = children.forall(_.supportsColumnar)
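
A simplified, self-contained sketch (hypothetical Partitioning ADT, plain Scala) of the compatibility check above: the union only reports a known output partitioning when every child reports one compatible with the first child's, and range partitionings are never treated as compatible because their bounds may differ.

    sealed trait Partitioning
    case object SinglePartition extends Partitioning
    case class HashPartitioning(keys: Seq[String], numPartitions: Int) extends Partitioning
    case class RangePartitioning(keys: Seq[String], numPartitions: Int) extends Partitioning

    def compatible(left: Partitioning, right: Partitioning): Boolean = (left, right) match {
      case (SinglePartition, SinglePartition) => true
      case (l: HashPartitioning, r: HashPartitioning) => l == r
      // Range partitionings may have different bounds even with identical keys and counts.
      case _ => false
    }

    def unionOutputPartitioning(children: Seq[Partitioning]): Option[Partitioning] =
      children.headOption.filter(head => children.forall(compatible(_, head)))

    // unionOutputPartitioning(Seq(HashPartitioning(Seq("a"), 8), HashPartitioning(Seq("a"), 8)))
    //   => Some(HashPartitioning(Seq("a"), 8))
    // unionOutputPartitioning(Seq(RangePartitioning(Seq("a"), 8), RangePartitioning(Seq("a"), 8)))
    //   => None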
@@ -790,6 +862,7 @@ abstract class BaseSubqueryExec extends SparkPlan {
addSuffix: Boolean = false,
maxFields: Int,
printNodeId: Boolean,
+ printOutputColumns: Boolean,
indent: Int = 0): Unit = {
/**
* In the new explain mode `EXPLAIN FORMATTED`, the subqueries are not shown in the
@@ -807,6 +880,7 @@ abstract class BaseSubqueryExec extends SparkPlan {
false,
maxFields,
printNodeId,
+ printOutputColumns,
indent)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnAccessor.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnAccessor.scala
index 2074649cc9863..6fb1f5263b518 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnAccessor.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnAccessor.scala
@@ -147,7 +147,7 @@ private[sql] object ColumnAccessor {
case ByteType => new ByteColumnAccessor(buf)
case ShortType => new ShortColumnAccessor(buf)
case IntegerType | DateType | _: YearMonthIntervalType => new IntColumnAccessor(buf)
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType =>
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
new LongColumnAccessor(buf)
case FloatType => new FloatColumnAccessor(buf)
case DoubleType => new DoubleColumnAccessor(buf)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnBuilder.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnBuilder.scala
index b65ef12f12d56..a63569b19a018 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnBuilder.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnBuilder.scala
@@ -185,7 +185,7 @@ private[columnar] object ColumnBuilder {
case ByteType => new ByteColumnBuilder
case ShortType => new ShortColumnBuilder
case IntegerType | DateType | _: YearMonthIntervalType => new IntColumnBuilder
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType =>
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
new LongColumnBuilder
case FloatType => new FloatColumnBuilder
case DoubleType => new DoubleColumnBuilder
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnType.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnType.scala
index 60695a6c5d49c..df250e529e2ce 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnType.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/ColumnType.scala
@@ -869,7 +869,8 @@ private[columnar] object ColumnType {
case ByteType => BYTE
case ShortType => SHORT
case IntegerType | DateType | _: YearMonthIntervalType => INT
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType => LONG
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
+ LONG
case FloatType => FLOAT
case DoubleType => DOUBLE
case s: StringType => STRING(s)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/GenerateColumnAccessor.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/GenerateColumnAccessor.scala
index d07ebeb843bba..dd64d92bed71e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/GenerateColumnAccessor.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/GenerateColumnAccessor.scala
@@ -82,7 +82,7 @@ object GenerateColumnAccessor extends CodeGenerator[Seq[DataType], ColumnarItera
case ByteType => classOf[ByteColumnAccessor].getName
case ShortType => classOf[ShortColumnAccessor].getName
case IntegerType | DateType | _: YearMonthIntervalType => classOf[IntColumnAccessor].getName
- case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType =>
+ case LongType | TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType =>
classOf[LongColumnAccessor].getName
case FloatType => classOf[FloatColumnAccessor].getName
case DoubleType => classOf[DoubleColumnAccessor].getName
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/InMemoryRelation.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/InMemoryRelation.scala
index 8f704cec7e892..eabbc7fc74f50 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/InMemoryRelation.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/columnar/InMemoryRelation.scala
@@ -19,7 +19,6 @@ package org.apache.spark.sql.execution.columnar
import com.esotericsoftware.kryo.{DefaultSerializer, Kryo, Serializer => KryoSerializer}
import com.esotericsoftware.kryo.io.{Input => KryoInput, Output => KryoOutput}
-import org.apache.commons.lang3.StringUtils
import org.apache.spark.{SparkException, TaskContext}
import org.apache.spark.network.util.JavaUtils
@@ -267,42 +266,29 @@ case class CachedRDDBuilder(
private val materializedPartitions = cachedPlan.session.sparkContext.longAccumulator
val cachedName = tableName.map(n => s"In-memory table $n")
- .getOrElse(StringUtils.abbreviate(cachedPlan.toString, 1024))
+ .getOrElse(Utils.abbreviate(cachedPlan.toString, 1024))
val supportsColumnarInput: Boolean = {
cachedPlan.supportsColumnar &&
serializer.supportsColumnarInput(cachedPlan.output)
}
- def cachedColumnBuffers: RDD[CachedBatch] = {
+ def cachedColumnBuffers: RDD[CachedBatch] = synchronized {
if (_cachedColumnBuffers == null) {
- synchronized {
- if (_cachedColumnBuffers == null) {
- _cachedColumnBuffers = buildBuffers()
- }
- }
+ _cachedColumnBuffers = buildBuffers()
}
_cachedColumnBuffers
}
- def clearCache(blocking: Boolean = false): Unit = {
+ def clearCache(blocking: Boolean = false): Unit = synchronized {
if (_cachedColumnBuffers != null) {
- synchronized {
- if (_cachedColumnBuffers != null) {
- _cachedColumnBuffers.unpersist(blocking)
- _cachedColumnBuffers = null
- }
- }
+ _cachedColumnBuffers.unpersist(blocking)
+ _cachedColumnBuffers = null
}
}
- def isCachedColumnBuffersLoaded: Boolean = {
- if (_cachedColumnBuffers != null) {
- synchronized {
- return _cachedColumnBuffers != null && isCachedRDDLoaded
- }
- }
- false
+ def isCachedColumnBuffersLoaded: Boolean = synchronized {
+ _cachedColumnBuffers != null && isCachedRDDLoaded
}
private def isCachedRDDLoaded: Boolean = {
@@ -381,22 +367,8 @@ object InMemoryRelation {
/* Visible for testing */
private[columnar] def clearSerializer(): Unit = synchronized { ser = None }
- def convertToColumnarIfPossible(plan: SparkPlan): SparkPlan = plan match {
- case gen: WholeStageCodegenExec => gen.child match {
- case c2r: ColumnarToRowTransition => c2r.child match {
- case ia: InputAdapter => ia.child
- case _ => plan
- }
- case _ => plan
- }
- case c2r: ColumnarToRowTransition => // This matches when whole stage code gen is disabled.
- c2r.child
- case adaptive: AdaptiveSparkPlanExec =>
- // If AQE is enabled for cached plan and table cache supports columnar in, we should mark
- // `AdaptiveSparkPlanExec.supportsColumnar` as true to avoid inserting `ColumnarToRow`, so
- // that `CachedBatchSerializer` can use `convertColumnarBatchToCachedBatch` to cache data.
- adaptive.copy(supportsColumnar = true)
- case _ => plan
+ def convertToColumnarIfPossible(plan: SparkPlan): SparkPlan = {
+ getSerializer(plan.conf).convertToColumnarPlanIfPossible(plan)
}
def apply(
@@ -406,7 +378,7 @@ object InMemoryRelation {
val optimizedPlan = qe.optimizedPlan
val serializer = getSerializer(optimizedPlan.conf)
val child = if (serializer.supportsColumnarInput(optimizedPlan.output)) {
- convertToColumnarIfPossible(qe.executedPlan)
+ serializer.convertToColumnarPlanIfPossible(qe.executedPlan)
} else {
qe.executedPlan
}
@@ -433,8 +405,9 @@ object InMemoryRelation {
def apply(cacheBuilder: CachedRDDBuilder, qe: QueryExecution): InMemoryRelation = {
val optimizedPlan = qe.optimizedPlan
- val newBuilder = if (cacheBuilder.serializer.supportsColumnarInput(optimizedPlan.output)) {
- cacheBuilder.copy(cachedPlan = convertToColumnarIfPossible(qe.executedPlan))
+ val serializer = cacheBuilder.serializer
+ val newBuilder = if (serializer.supportsColumnarInput(optimizedPlan.output)) {
+ cacheBuilder.copy(cachedPlan = serializer.convertToColumnarPlanIfPossible(qe.executedPlan))
} else {
cacheBuilder.copy(cachedPlan = qe.executedPlan)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/AnalyzeTablesCommand.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/AnalyzeTablesCommand.scala
index 26192551632e3..f3a0da2437ae8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/AnalyzeTablesCommand.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/AnalyzeTablesCommand.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.execution.command
import scala.util.control.NonFatal
import org.apache.spark.internal.LogKeys.{DATABASE_NAME, ERROR, TABLE_NAME}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.{Row, SparkSession}
import org.apache.spark.sql.classic.ClassicConversions.castToImpl
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CommandUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CommandUtils.scala
index 7cbba170cd1e6..9a86357ca0b76 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CommandUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CommandUtils.scala
@@ -24,7 +24,7 @@ import scala.util.control.NonFatal
import org.apache.hadoop.fs.{FileStatus, FileSystem, Path, PathFilter}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{COUNT, DATABASE_NAME, ERROR, TABLE_NAME, TIME}
import org.apache.spark.sql.catalyst.{InternalRow, TableIdentifier}
import org.apache.spark.sql.catalyst.analysis.ResolvedIdentifier
@@ -36,7 +36,7 @@ import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.util.{ArrayData, GenericArrayData}
import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.errors.QueryCompilationErrors
-import org.apache.spark.sql.execution.QueryExecution
+import org.apache.spark.sql.execution.{QueryExecution, RemoveShuffleFiles}
import org.apache.spark.sql.execution.datasources.{DataSourceUtils, InMemoryFileIndex}
import org.apache.spark.sql.functions.{col, lit}
import org.apache.spark.sql.internal.{SessionState, SQLConf}
@@ -304,8 +304,8 @@ object CommandUtils extends Logging {
columns.map(statExprs(_, conf, attributePercentiles))
val namedExpressions = expressions.map(e => Alias(e, e.toString)())
- val statsRow = new QueryExecution(sparkSession, Aggregate(Nil, namedExpressions, relation))
- .executedPlan.executeTake(1).head
+ val statsRow = new QueryExecution(sparkSession, Aggregate(Nil, namedExpressions, relation),
+ shuffleCleanupMode = RemoveShuffleFiles).executedPlan.executeTake(1).head
val rowCount = statsRow.getLong(0)
val columnStats = columns.zipWithIndex.map { case (attr, i) =>
@@ -341,8 +341,8 @@ object CommandUtils extends Logging {
Alias(expr, expr.toString)()
}
- val percentilesRow = new QueryExecution(sparkSession, Aggregate(Nil, namedExprs, relation))
- .executedPlan.executeTake(1).head
+ val percentilesRow = new QueryExecution(sparkSession, Aggregate(Nil, namedExprs, relation),
+ shuffleCleanupMode = RemoveShuffleFiles).executedPlan.executeTake(1).head
attrsToGenHistogram.zipWithIndex.foreach { case (attr, i) =>
val percentiles = percentilesRow.getArray(i)
// When there is no non-null value, `percentiles` is null. In such case, there is no
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateSQLFunctionCommand.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateSQLFunctionCommand.scala
index 09b2c86970754..eb860089b0c88 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateSQLFunctionCommand.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateSQLFunctionCommand.scala
@@ -20,13 +20,15 @@ package org.apache.spark.sql.execution.command
import org.apache.spark.SparkException
import org.apache.spark.sql.{AnalysisException, Row, SparkSession}
import org.apache.spark.sql.catalyst.FunctionIdentifier
-import org.apache.spark.sql.catalyst.analysis.{Analyzer, SQLFunctionNode, UnresolvedAlias, UnresolvedAttribute, UnresolvedFunction, UnresolvedRelation}
+import org.apache.spark.sql.catalyst.analysis.{withPosition, Analyzer, SQLFunctionExpression, SQLFunctionNode, SQLScalarFunction, SQLTableFunction, UnresolvedAlias, UnresolvedAttribute, UnresolvedFunction, UnresolvedRelation, UnresolvedTableValuedFunction}
import org.apache.spark.sql.catalyst.catalog.{SessionCatalog, SQLFunction, UserDefinedFunction, UserDefinedFunctionErrors}
-import org.apache.spark.sql.catalyst.expressions.{Alias, Cast, Generator, LateralSubquery, Literal, ScalarSubquery, SubqueryExpression, WindowExpression}
+import org.apache.spark.sql.catalyst.catalog.UserDefinedFunction._
+import org.apache.spark.sql.catalyst.expressions.{Alias, Cast, Expression, Generator, LateralSubquery, Literal, ScalarSubquery, SubqueryExpression, WindowExpression}
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
import org.apache.spark.sql.catalyst.plans.Inner
-import org.apache.spark.sql.catalyst.plans.logical.{LateralJoin, LogicalPlan, OneRowRelation, Project, UnresolvedWith}
+import org.apache.spark.sql.catalyst.plans.logical.{LateralJoin, LocalRelation, LogicalPlan, OneRowRelation, Project, Range, UnresolvedWith, View}
import org.apache.spark.sql.catalyst.trees.TreePattern.UNRESOLVED_ATTRIBUTE
+import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.MultipartIdentifierHelper
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.command.CreateUserDefinedFunctionCommand._
import org.apache.spark.sql.types.{DataType, StructField, StructType}
@@ -150,6 +152,9 @@ case class CreateSQLFunctionCommand(
Project(outputAlias, inputPlan)
}
+ // Check cyclic function reference before running the analyzer.
+ checkCyclicFunctionReference(catalog, name, plan)
+
// Check the function body can be analyzed correctly.
val analyzed = analyzer.execute(plan)
val (resolved, resolvedReturnType) = analyzed match {
@@ -172,6 +177,8 @@ case class CreateSQLFunctionCommand(
if (query.isEmpty) {
throw UserDefinedFunctionErrors.bodyIsNotAQueryForSqlTableUdf(name.funcName)
}
+ // Check cyclic function reference before running the analyzer.
+ checkCyclicFunctionReference(catalog, name, query.get)
// Construct a lateral join to analyze the function body.
val plan = LateralJoin(inputPlan, LateralSubquery(query.get), Inner, None)
@@ -241,10 +248,14 @@ case class CreateSQLFunctionCommand(
// Derive determinism of the SQL function.
val deterministic = analyzedPlan.deterministic
+ // Derive the SQL data access and check that a function declared with CONTAINS SQL does not read SQL data.
+ val readsSQLData = deriveSQLDataAccess(analyzedPlan)
+
function.copy(
// Assign the return type, inferring from the function body if needed.
returnType = inferredReturnType,
deterministic = Some(function.deterministic.getOrElse(deterministic)),
+ containsSQL = Some(function.containsSQL.getOrElse(!readsSQLData)),
properties = properties
)
}
@@ -367,6 +378,61 @@ case class CreateSQLFunctionCommand(
}
}
+ /**
+ * Check if the given plan contains cyclic function references.
+ */
+ private def checkCyclicFunctionReference(
+ catalog: SessionCatalog,
+ identifier: FunctionIdentifier,
+ plan: LogicalPlan): Unit = {
+
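+ // Traverse the plan and its expressions, expanding referenced SQL functions and tracking the
+ // path of visited function names; reaching the function being created again indicates a cycle.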
+ def checkPlan(plan: LogicalPlan, path: Seq[FunctionIdentifier]): Unit = {
+ plan.foreach {
+ case u @ UnresolvedTableValuedFunction(nameParts, arguments, _) =>
+ val funcId = nameParts.asFunctionIdentifier
+ val info = catalog.lookupFunctionInfo(funcId)
+ if (isSQLFunction(info.getClassName)) {
+ val f = withPosition(u) {
+ catalog.lookupTableFunction(funcId, arguments).asInstanceOf[SQLTableFunction]
+ }
+ // Check cyclic reference using qualified function names.
+ val newPath = path :+ f.function.name
+ if (f.function.name == name) {
+ throw UserDefinedFunctionErrors.cyclicFunctionReference(newPath.mkString(" -> "))
+ }
+ val plan = catalog.makeSQLTableFunctionPlan(f.name, f.function, f.inputs, f.output)
+ checkPlan(plan, newPath)
+ }
+ case p: LogicalPlan =>
+ p.expressions.foreach(checkExpression(_, path))
+ }
+ }
+
+ def checkExpression(expression: Expression, path: Seq[FunctionIdentifier]): Unit = {
+ expression.foreach {
+ case s: SubqueryExpression => checkPlan(s.plan, path)
+ case u @ UnresolvedFunction(nameParts, arguments, _, _, _, _, _) =>
+ val funcId = nameParts.asFunctionIdentifier
+ val info = catalog.lookupFunctionInfo(funcId)
+ if (isSQLFunction(info.getClassName)) {
+ val f = withPosition(u) {
+ catalog.lookupFunction(funcId, arguments).asInstanceOf[SQLFunctionExpression]
+ }
+ // Check cyclic reference using qualified function names.
+ val newPath = path :+ f.function.name
+ if (f.function.name == name) {
+ throw UserDefinedFunctionErrors.cyclicFunctionReference(newPath.mkString(" -> "))
+ }
+ val plan = catalog.makeSQLFunctionPlan(f.name, f.function, f.inputs)
+ checkPlan(plan, newPath)
+ }
+ case _ =>
+ }
+ }
+
+ checkPlan(plan, Seq(identifier))
+ }
+
/**
* Check if the SQL function body contains aggregate/window/generate functions.
* Note subqueries inside the SQL function body can contain aggregate/window/generate functions.
@@ -384,6 +450,43 @@ case class CreateSQLFunctionCommand(
}
}
+ /**
+ * Derive the SQL data access routine of the function and check that the function body
+ * matches it. If the data access is CONTAINS SQL, the body must not contain operators
+ * or expressions that read SQL data.
+ *
+ * Returns true if the SQL data access routine is READS SQL DATA, otherwise returns false.
+ */
+ private def deriveSQLDataAccess(plan: LogicalPlan): Boolean = {
+ // Find logical plan nodes that read SQL data.
+ val readsSQLData = plan.find {
+ case _: View => true
+ case p if p.children.isEmpty => p match {
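+ // Leaf nodes other than OneRowRelation/LocalRelation/Range (typically table scans)
+ // are treated as reading SQL data.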
+ case _: OneRowRelation | _: LocalRelation | _: Range => false
+ case _ => true
+ }
+ case f: SQLFunctionNode => f.function.containsSQL.contains(false)
+ case p: LogicalPlan =>
+ lazy val sub = p.subqueries.exists(deriveSQLDataAccess)
+ // If the SQL function contains another SQL function whose data access routine is
+ // READS SQL DATA, then this SQL function is also READS SQL DATA.
+ p.expressions.exists(expr => expr.find {
+ case f: SQLScalarFunction => f.function.containsSQL.contains(false)
+ case sub: SubqueryExpression => deriveSQLDataAccess(sub.plan)
+ case _ => false
+ }.isDefined)
+ }.isDefined
+
+ if (containsSQL.contains(true) && readsSQLData) {
+ throw new AnalysisException(
+ errorClass = "INVALID_SQL_FUNCTION_DATA_ACCESS",
+ messageParameters = Map.empty
+ )
+ }
+
+ readsSQLData
+ }
+
/**
* Generate the function properties, including:
* 1. the SQL configs when creating the function.
@@ -407,7 +510,7 @@ case class CreateSQLFunctionCommand(
}
val tempVars = ViewHelper.collectTemporaryVariables(analyzed)
- sqlConfigsToProps(conf) ++
+ sqlConfigsToProps(conf, SQL_CONFIG_PREFIX) ++
catalogAndNamespaceToProps(
manager.currentCatalog.name,
manager.currentNamespace.toIndexedSeq) ++
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateUserDefinedFunctionCommand.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateUserDefinedFunctionCommand.scala
index 1ee3c8a4c388f..78ff514bf9e51 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateUserDefinedFunctionCommand.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/CreateUserDefinedFunctionCommand.scala
@@ -20,9 +20,8 @@ package org.apache.spark.sql.execution.command
import java.util.Locale
import org.apache.spark.sql.AnalysisException
-import org.apache.spark.sql.catalyst.FunctionIdentifier
+import org.apache.spark.sql.catalyst.{CapturesConfig, FunctionIdentifier}
import org.apache.spark.sql.catalyst.catalog.{LanguageSQL, RoutineLanguage, UserDefinedFunctionErrors}
-import org.apache.spark.sql.catalyst.catalog.UserDefinedFunction._
import org.apache.spark.sql.catalyst.plans.logical.IgnoreCachedData
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.StructType
@@ -31,7 +30,7 @@ import org.apache.spark.sql.types.StructType
* The base class for CreateUserDefinedFunctionCommand
*/
abstract class CreateUserDefinedFunctionCommand
- extends LeafRunnableCommand with IgnoreCachedData
+ extends LeafRunnableCommand with IgnoreCachedData with CapturesConfig
object CreateUserDefinedFunctionCommand {
@@ -81,18 +80,6 @@ object CreateUserDefinedFunctionCommand {
}
}
- /**
- * Convert SQL configs to properties by prefixing all configs with a key.
- * When converting a function to [[org.apache.spark.sql.catalyst.catalog.CatalogFunction]] or
- * [[org.apache.spark.sql.catalyst.expressions.ExpressionInfo]], all SQL configs and other
- * function properties (such as the function parameters and the function return type)
- * are saved together in a property map.
- */
- def sqlConfigsToProps(conf: SQLConf): Map[String, String] = {
- val modifiedConfs = ViewHelper.getModifiedConf(conf)
- modifiedConfs.map { case (key, value) => s"$SQL_CONFIG_PREFIX$key" -> value }
- }
-
/**
* Check whether the function parameters contain duplicated column names.
* It takes the function input parameter struct as input and verifies that there is no duplicates
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/InsertIntoDataSourceDirCommand.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/InsertIntoDataSourceDirCommand.scala
index d3a72f915c47b..667623fb95b03 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/InsertIntoDataSourceDirCommand.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/InsertIntoDataSourceDirCommand.scala
@@ -18,7 +18,6 @@
package org.apache.spark.sql.execution.command
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.{AnalysisException, Row, SaveMode, SparkSession}
import org.apache.spark.sql.catalyst.catalog._
import org.apache.spark.sql.catalyst.plans.logical.{CTEInChildren, CTERelationDef, LogicalPlan, WithCTE}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/SetCommand.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/SetCommand.scala
index 87cd9376b77b1..a3591ff89e5cf 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/SetCommand.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/SetCommand.scala
@@ -17,9 +17,10 @@
package org.apache.spark.sql.execution.command
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CONFIG, CONFIG2, KEY, VALUE}
import org.apache.spark.sql.{AnalysisException, Row, SparkSession}
+import org.apache.spark.sql.catalyst.analysis.{AnalysisContext, VariableResolution}
import org.apache.spark.sql.catalyst.expressions.Attribute
import org.apache.spark.sql.catalyst.parser.ParseException
import org.apache.spark.sql.catalyst.plans.logical.IgnoreCachedData
@@ -107,7 +108,14 @@ case class SetCommand(kv: Option[(String, Option[String])])
Seq()
}
if (varName.nonEmpty && varName.length <= 3) {
- if (sparkSession.sessionState.analyzer.lookupVariable(varName).isDefined) {
+ val variableResolution = new VariableResolution(
+ sparkSession.sessionState.analyzer.catalogManager.tempVariableManager
+ )
+ val variable = variableResolution.lookupVariable(
+ nameParts = varName,
+ resolvingExecuteImmediate = AnalysisContext.get.isExecuteImmediate
+ )
+ if (variable.isDefined) {
throw new AnalysisException(
errorClass = "UNSUPPORTED_FEATURE.SET_VARIABLE_USING_SET",
messageParameters = Map("variableName" -> toSQLId(varName)))
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/commands.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/commands.scala
index ee21d7e970dfd..0ea52f3dccb84 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/commands.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/commands.scala
@@ -32,7 +32,7 @@ import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.{CommandExecutionMode, ExplainMode, LeafExecNode, SparkPlan, UnaryExecNode}
import org.apache.spark.sql.execution.datasources.DataSource
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.IncrementalExecution
+import org.apache.spark.sql.execution.streaming.runtime.IncrementalExecution
import org.apache.spark.sql.types._
import org.apache.spark.sql.util.CaseInsensitiveStringMap
import org.apache.spark.util.ArrayImplicits._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/createDataSourceTables.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/createDataSourceTables.scala
index f29d2267f75fd..5ef19b832f5b3 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/createDataSourceTables.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/createDataSourceTables.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.execution.command
import java.net.URI
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.{AnalysisException, Row, SaveMode, SparkSession}
import org.apache.spark.sql.catalyst.catalog._
import org.apache.spark.sql.catalyst.plans.logical.{CTEInChildren, CTERelationDef, LogicalPlan, WithCTE}
@@ -119,9 +118,7 @@ case class CreateDataSourceTableCommand(table: CatalogTable, ignoreIfExists: Boo
}
- // We will return Nil or throw exception at the beginning if the table already exists, so when
- // we reach here, the table should not exist and we should set `ignoreIfExists` to false.
- sessionState.catalog.createTable(newTable, ignoreIfExists = false)
+ sessionState.catalog.createTable(newTable, ignoreIfExists)
Seq.empty[Row]
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/ddl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/ddl.scala
index 13994c58f1206..8a4f586edfe05 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/ddl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/ddl.scala
@@ -28,11 +28,11 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs._
import org.apache.hadoop.mapred.{FileInputFormat, JobConf}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.config.RDD_PARALLEL_LISTING_THRESHOLD
-import org.apache.spark.sql.{Row, SparkSession}
+import org.apache.spark.sql.{Row, SaveMode, SparkSession}
import org.apache.spark.sql.catalyst.TableIdentifier
-import org.apache.spark.sql.catalyst.analysis.Resolver
+import org.apache.spark.sql.catalyst.analysis.{EliminateSubqueryAliases, Resolver}
import org.apache.spark.sql.catalyst.catalog._
import org.apache.spark.sql.catalyst.catalog.CatalogTypes.TablePartitionSpec
import org.apache.spark.sql.catalyst.expressions.Attribute
@@ -46,7 +46,7 @@ import org.apache.spark.sql.connector.catalog.CatalogManager.SESSION_CATALOG_NAM
import org.apache.spark.sql.connector.catalog.SupportsNamespaces._
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.errors.QueryExecutionErrors.hiveTableWithAnsiIntervalsError
-import org.apache.spark.sql.execution.datasources.{DataSource, DataSourceUtils, FileFormat, HadoopFsRelation, LogicalRelationWithTable}
+import org.apache.spark.sql.execution.datasources.{CreateTable, DataSource, DataSourceUtils, FileFormat, HadoopFsRelation, LogicalRelation, LogicalRelationWithTable}
import org.apache.spark.sql.execution.datasources.v2.FileDataSourceV2
import org.apache.spark.sql.internal.{HiveSerDe, SQLConf}
import org.apache.spark.sql.types._
@@ -189,8 +189,9 @@ case class DescribeDatabaseCommand(
Row("Catalog Name", SESSION_CATALOG_NAME) ::
Row("Database Name", dbMetadata.name) ::
Row("Comment", dbMetadata.description) ::
- Row("Location", CatalogUtils.URIToString(dbMetadata.locationUri))::
- Row("Owner", allDbProperties.getOrElse(PROP_OWNER, "")) :: Nil
+ Row("Location", CatalogUtils.URIToString(dbMetadata.locationUri)) ::
+ Row("Owner", allDbProperties.getOrElse(PROP_OWNER, "")) ::
+ allDbProperties.get(PROP_COLLATION).map(Row("Collation", _)).toList
if (extended) {
val properties = allDbProperties -- CatalogV2Util.NAMESPACE_RESERVED_PROPERTIES
@@ -464,7 +465,7 @@ case class AlterTableChangeColumnCommand(
// when altering column. Only changes in collation of data type or its nested types (recursively)
// are allowed.
private def canEvolveType(from: StructField, to: StructField): Boolean = {
- DataType.equalsIgnoreCompatibleCollation(from.dataType, to.dataType)
+ DataType.equalsIgnoreCompatibleCollation(from.dataType, to.dataType, checkComplexTypes = false)
}
}
@@ -955,6 +956,64 @@ case class AlterTableSetLocationCommand(
}
}
+/**
+ * A command that saves a query as a V1 table.
+ */
+private[sql] case class SaveAsV1TableCommand(
+ tableDesc: CatalogTable,
+ mode: SaveMode,
+ query: LogicalPlan) extends LeafRunnableCommand {
+ override def run(sparkSession: SparkSession): Seq[Row] = {
+ val catalog = sparkSession.sessionState.catalog
+ val qualifiedIdent = catalog.qualifyIdentifier(tableDesc.identifier)
+ val tableDescWithQualifiedIdent = tableDesc.copy(identifier = qualifiedIdent)
+ val tableExists = catalog.tableExists(qualifiedIdent)
+
+ (tableExists, mode) match {
+ case (true, SaveMode.Ignore) =>
+ // Do nothing
+
+ case (true, SaveMode.ErrorIfExists) =>
+ throw QueryCompilationErrors.tableAlreadyExistsError(qualifiedIdent)
+
+ case (true, SaveMode.Overwrite) =>
+ // Get all input data source or hive relations of the query.
+ val srcRelations = query.collect {
+ case l: LogicalRelation => l.relation
+ case relation: HiveTableRelation => relation.tableMeta.identifier
+ }
+
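+ // Refuse to overwrite a table that the query itself reads from.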
+ val tableRelation = sparkSession.table(qualifiedIdent).queryExecution.analyzed
+ EliminateSubqueryAliases(tableRelation) match {
+ // check if the table is a data source table (the relation is a BaseRelation).
+ case l: LogicalRelation if srcRelations.contains(l.relation) =>
+ throw QueryCompilationErrors.cannotOverwriteTableThatIsBeingReadFromError(
+ qualifiedIdent)
+ // check Hive table relations when in overwrite mode
+ case relation: HiveTableRelation
+ if srcRelations.contains(relation.tableMeta.identifier) =>
+ throw QueryCompilationErrors.cannotOverwriteTableThatIsBeingReadFromError(
+ qualifiedIdent)
+ case _ => // OK
+ }
+
+ // Drop the existing table
+ catalog.dropTable(qualifiedIdent, ignoreIfNotExists = true, purge = false)
+ runCommand(sparkSession, CreateTable(tableDescWithQualifiedIdent, mode, Some(query)))
+ // Refresh the cache of the table in the catalog.
+ catalog.refreshTable(qualifiedIdent)
+
+ case _ =>
+ runCommand(sparkSession, CreateTable(tableDescWithQualifiedIdent, mode, Some(query)))
+ }
+ Seq.empty[Row]
+ }
+
+ private def runCommand(session: SparkSession, command: LogicalPlan): Unit = {
+ val qe = session.sessionState.executePlan(command)
+ qe.assertCommandExecuted()
+ }
+}
object DDLUtils extends Logging {
val HIVE_PROVIDER = "hive"
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/tables.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/tables.scala
index 092e6669338ee..d5dd934af2be1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/tables.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/tables.scala
@@ -247,8 +247,9 @@ case class AlterTableAddColumnsCommand(
}
DDLUtils.checkTableColumns(catalogTable, StructType(colsWithProcessedDefaults))
- val existingSchema = CharVarcharUtils.getRawSchema(catalogTable.dataSchema)
- catalog.alterTableDataSchema(table, StructType(existingSchema ++ colsWithProcessedDefaults))
+ val existingDataSchema = CharVarcharUtils.getRawSchema(catalogTable.dataSchema)
+ catalog.alterTableSchema(table,
+ StructType(existingDataSchema ++ colsWithProcessedDefaults ++ catalogTable.partitionSchema))
Seq.empty[Row]
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/CreateVariableExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/CreateVariableExec.scala
index 1b9c1711853c3..e625f02b8bbe5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/CreateVariableExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/CreateVariableExec.scala
@@ -19,6 +19,9 @@ package org.apache.spark.sql.execution.command.v2
import java.util.Locale
+import scala.collection.mutable
+
+import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.catalyst.{InternalRow, SqlScriptingContextManager}
import org.apache.spark.sql.catalyst.analysis.{FakeLocalCatalog, ResolvedIdentifier}
import org.apache.spark.sql.catalyst.catalog.VariableDefinition
@@ -28,10 +31,10 @@ import org.apache.spark.sql.connector.catalog.Identifier
import org.apache.spark.sql.execution.datasources.v2.LeafV2CommandExec
/**
- * Physical plan node for creating a variable.
+ * Physical plan node for creating variables.
*/
case class CreateVariableExec(
- resolvedIdentifier: ResolvedIdentifier,
+ resolvedIdentifiers: Seq[ResolvedIdentifier],
defaultExpr: DefaultValueExpression,
replace: Boolean) extends LeafV2CommandExec with ExpressionsEvaluator {
@@ -43,25 +46,58 @@ case class CreateVariableExec(
initializeExprs(exprs, 0)
val initValue = Literal(exprs.head.eval(), defaultExpr.dataType)
- val normalizedIdentifier = if (session.sessionState.conf.caseSensitiveAnalysis) {
- resolvedIdentifier.identifier
- } else {
- Identifier.of(
- resolvedIdentifier.identifier.namespace().map(_.toLowerCase(Locale.ROOT)),
- resolvedIdentifier.identifier.name().toLowerCase(Locale.ROOT))
- }
- val varDef = VariableDefinition(normalizedIdentifier, defaultExpr.originalSQL, initValue)
-
- // create local variable if we are in a script, otherwise create session variable
- scriptingVariableManager
- .filter(_ => resolvedIdentifier.catalog == FakeLocalCatalog)
+ val variableTuples = resolvedIdentifiers.map(resolvedIdentifier => {
+ val normalizedIdentifier = if (session.sessionState.conf.caseSensitiveAnalysis) {
+ resolvedIdentifier.identifier
+ } else {
+ Identifier.of(
+ resolvedIdentifier.identifier.namespace().map(_.toLowerCase(Locale.ROOT)),
+ resolvedIdentifier.identifier.name().toLowerCase(Locale.ROOT))
+ }
+ val varDef = VariableDefinition(normalizedIdentifier, defaultExpr.originalSQL, initValue)
+
+ (normalizedIdentifier.namespace().toSeq :+ normalizedIdentifier.name(), varDef)
+ })
+
+ // create local variables if we are in a script, otherwise create session variables
+ val variableManager =
+ scriptingVariableManager
+ .filter(_ => resolvedIdentifiers.head.catalog == FakeLocalCatalog)
// If resolvedIdentifier.catalog is FakeLocalCatalog, scriptingVariableManager
// will always be present.
.getOrElse(tempVariableManager)
- .create(
- normalizedIdentifier.namespace().toSeq :+ normalizedIdentifier.name(),
- varDef,
- replace)
+
+ val uniqueNames = mutable.Set[String]()
+
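+ // Validate all declared names first; variables are only created in the second pass once
+ // every check passes.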
+ variableTuples.foreach(variable => {
+ val nameParts: Seq[String] = variable._1
+ val name = nameParts.last
+
+ // Check if the variable name was already declared inside the same DECLARE statement
+ if (uniqueNames.contains(name)) {
+ throw new AnalysisException(
+ errorClass = "DUPLICATE_VARIABLE_NAME_INSIDE_DECLARE",
+ messageParameters = Map(
+ "variableName" -> variableManager.getVariableNameForError(name)))
+ }
+
+ // If the DECLARE statement does not have an OR REPLACE clause, check whether any of the
+ // declared variable names already exists as the name of another variable
+ if (!replace && variableManager.get(nameParts).isDefined) {
+ throw new AnalysisException(
+ errorClass = "VARIABLE_ALREADY_EXISTS",
+ messageParameters = Map(
+ "variableName" -> variableManager.getVariableNameForError(name)))
+ }
+
+ uniqueNames.add(name)
+ })
+
+ variableTuples.foreach(variable => {
+ val nameParts: Seq[String] = variable._1
+ val varDef: VariableDefinition = variable._2
+ variableManager.create(nameParts, varDef, replace)
+ })
Nil
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/V2CommandStrategy.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/V2CommandStrategy.scala
index 3e073202d4c7f..63c4cd9db158a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/V2CommandStrategy.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/v2/V2CommandStrategy.scala
@@ -27,8 +27,12 @@ object V2CommandStrategy extends Strategy {
// TODO: move v2 commands to here which are not data source v2 related.
override def apply(plan: LogicalPlan): Seq[SparkPlan] = plan match {
- case CreateVariable(ident: ResolvedIdentifier, defaultExpr, replace) =>
- CreateVariableExec(ident, defaultExpr, replace) :: Nil
+ case CreateVariable(idents: Seq[LogicalPlan], defaultExpr, replace)
+ if idents.forall(_.isInstanceOf[ResolvedIdentifier]) =>
+ CreateVariableExec(
+ idents.map(_.asInstanceOf[ResolvedIdentifier]),
+ defaultExpr,
+ replace) :: Nil
case DropVariable(ident: ResolvedIdentifier, ifExists) =>
DropVariableExec(ident.identifier.name, ifExists) :: Nil
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/views.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/views.scala
index e3beffaf920dc..514b64f6abed2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/command/views.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/command/views.scala
@@ -25,7 +25,7 @@ import org.json4s.jackson.JsonMethods._
import org.apache.spark.SparkException
import org.apache.spark.internal.Logging
import org.apache.spark.sql.{Row, SparkSession}
-import org.apache.spark.sql.catalyst.{SQLConfHelper, TableIdentifier}
+import org.apache.spark.sql.catalyst.{CapturesConfig, SQLConfHelper, TableIdentifier}
import org.apache.spark.sql.catalyst.analysis.{AnalysisContext, GlobalTempView, LocalTempView, SchemaEvolution, SchemaUnsupported, ViewSchemaMode, ViewType}
import org.apache.spark.sql.catalyst.catalog.{CatalogStorageFormat, CatalogTable, CatalogTableType, TemporaryViewRelation}
import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute, SubqueryExpression, VariableReference}
@@ -34,7 +34,7 @@ import org.apache.spark.sql.catalyst.util.CharVarcharUtils
import org.apache.spark.sql.classic.ClassicConversions.castToImpl
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.NamespaceHelper
import org.apache.spark.sql.errors.QueryCompilationErrors
-import org.apache.spark.sql.internal.{SQLConf, StaticSQLConf}
+import org.apache.spark.sql.internal.StaticSQLConf
import org.apache.spark.sql.types.{MetadataBuilder, StructType}
import org.apache.spark.sql.util.SchemaUtils
import org.apache.spark.util.ArrayImplicits._
@@ -413,37 +413,7 @@ case class ShowViewsCommand(
}
}
-object ViewHelper extends SQLConfHelper with Logging {
-
- private val configPrefixDenyList = Seq(
- SQLConf.MAX_NESTED_VIEW_DEPTH.key,
- "spark.sql.optimizer.",
- "spark.sql.codegen.",
- "spark.sql.execution.",
- "spark.sql.shuffle.",
- "spark.sql.adaptive.",
- // ignore optimization configs used in `RelationConversions`
- "spark.sql.hive.convertMetastoreParquet",
- "spark.sql.hive.convertMetastoreOrc",
- "spark.sql.hive.convertInsertingPartitionedTable",
- "spark.sql.hive.convertInsertingUnpartitionedTable",
- "spark.sql.hive.convertMetastoreCtas",
- SQLConf.ADDITIONAL_REMOTE_REPOSITORIES.key)
-
- private val configAllowList = Seq(
- SQLConf.DISABLE_HINTS.key
- )
-
- /**
- * Capture view config either of:
- * 1. exists in allowList
- * 2. do not exists in denyList
- */
- private def shouldCaptureConfig(key: String): Boolean = {
- configAllowList.exists(prefix => key.equals(prefix)) ||
- !configPrefixDenyList.exists(prefix => key.startsWith(prefix))
- }
-
+object ViewHelper extends SQLConfHelper with Logging with CapturesConfig {
import CatalogTable._
/**
@@ -471,34 +441,6 @@ object ViewHelper extends SQLConfHelper with Logging {
}
}
- /**
- * Get all configurations that are modifiable and should be captured.
- */
- def getModifiedConf(conf: SQLConf): Map[String, String] = {
- conf.getAllConfs.filter { case (k, _) =>
- conf.isModifiable(k) && shouldCaptureConfig(k)
- }
- }
-
- /**
- * Convert the view SQL configs to `properties`.
- */
- private def sqlConfigsToProps(conf: SQLConf): Map[String, String] = {
- val modifiedConfs = getModifiedConf(conf)
- // Some configs have dynamic default values, such as SESSION_LOCAL_TIMEZONE whose
- // default value relies on the JVM system timezone. We need to always capture them to
- // to make sure we apply the same configs when reading the view.
- val alwaysCaptured = Seq(SQLConf.SESSION_LOCAL_TIMEZONE)
- .filter(c => !modifiedConfs.contains(c.key))
- .map(c => (c.key, conf.getConf(c)))
-
- val props = new mutable.HashMap[String, String]
- for ((key, value) <- modifiedConfs ++ alwaysCaptured) {
- props.put(s"$VIEW_SQL_CONFIG_PREFIX$key", value)
- }
- props.toMap
- }
-
/**
* Remove the view SQL configs in `properties`.
*/
@@ -586,13 +528,21 @@ object ViewHelper extends SQLConfHelper with Logging {
// names.
SchemaUtils.checkColumnNameDuplication(fieldNames.toImmutableArraySeq, conf.resolver)
+ val queryColumnNameProps = if (viewSchemaMode == SchemaEvolution) {
+ // If the view schema mode is SCHEMA EVOLUTION, we skip generating the query output
+ // column names as table properties and always use the view schema, since they are the same
+ Seq()
+ } else {
+ generateQueryColumnNames(queryOutput.toImmutableArraySeq)
+ }
+
// Generate the view default catalog and namespace, as well as captured SQL configs.
val manager = session.sessionState.catalogManager
removeReferredTempNames(removeSQLConfigs(removeQueryColumnNames(properties))) ++
catalogAndNamespaceToProps(
manager.currentCatalog.name, manager.currentNamespace.toImmutableArraySeq) ++
- sqlConfigsToProps(conf) ++
- generateQueryColumnNames(queryOutput.toImmutableArraySeq) ++
+ sqlConfigsToProps(conf, VIEW_SQL_CONFIG_PREFIX) ++
+ queryColumnNameProps ++
referredTempNamesToProps(tempViewNames, tempFunctionNames, tempVariableNames) ++
viewSchemaModeToProps(viewSchemaMode)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/BasicWriteStatsTracker.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/BasicWriteStatsTracker.scala
index 1858a84213598..9a38cc35b33f8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/BasicWriteStatsTracker.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/BasicWriteStatsTracker.scala
@@ -26,7 +26,7 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileSystem, Path}
import org.apache.spark.{SparkContext, TaskContext}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.LogKeys.{ACTUAL_NUM_FILES, EXPECTED_NUM_FILES}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.execution.SQLExecution
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/CodecStreams.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/CodecStreams.scala
index 9fddfad249e5b..0ee3a9d90cfe2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/CodecStreams.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/CodecStreams.scala
@@ -28,20 +28,11 @@ import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat
import org.apache.hadoop.util.ReflectionUtils
import org.apache.spark.TaskContext
+import org.apache.spark.io.HadoopCodecStreams
object CodecStreams {
- private def getDecompressionCodec(config: Configuration, file: Path): Option[CompressionCodec] = {
- val compressionCodecs = new CompressionCodecFactory(config)
- Option(compressionCodecs.getCodec(file))
- }
-
def createInputStream(config: Configuration, file: Path): InputStream = {
- val fs = file.getFileSystem(config)
- val inputStream: InputStream = fs.open(file)
-
- getDecompressionCodec(config, file)
- .map(codec => codec.createInputStream(inputStream))
- .getOrElse(inputStream)
+ HadoopCodecStreams.createInputStream(config, file)
}
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSource.scala
index 489f62bd97769..3816a446a57c7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSource.scala
@@ -27,7 +27,7 @@ import org.apache.hadoop.fs.Path
import org.apache.spark.SparkException
import org.apache.spark.deploy.SparkHadoopUtil
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CLASS_NAME, DATA_SOURCE, DATA_SOURCES, PATHS}
import org.apache.spark.sql.{AnalysisException, SaveMode, SparkSession}
import org.apache.spark.sql.catalyst.DataSourceOptions
@@ -49,7 +49,9 @@ import org.apache.spark.sql.execution.datasources.v2.FileDataSourceV2
import org.apache.spark.sql.execution.datasources.v2.orc.OrcDataSourceV2
import org.apache.spark.sql.execution.datasources.v2.python.PythonDataSourceV2
import org.apache.spark.sql.execution.datasources.xml.XmlFileFormat
-import org.apache.spark.sql.execution.streaming._
+import org.apache.spark.sql.execution.streaming.{Sink, Source}
+import org.apache.spark.sql.execution.streaming.runtime._
+import org.apache.spark.sql.execution.streaming.sinks.FileStreamSink
import org.apache.spark.sql.execution.streaming.sources.{RateStreamProvider, TextSocketSourceProvider}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.sources._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceManager.scala
index 711e096ebd1f8..790797e1f3183 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceManager.scala
@@ -21,7 +21,7 @@ import java.util.Locale
import java.util.concurrent.ConcurrentHashMap
import org.apache.spark.api.python.PythonUtils
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.DATA_SOURCE
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.datasources.v2.python.UserDefinedPythonDataSource
@@ -48,14 +48,13 @@ class DataSourceManager extends Logging {
*/
def registerDataSource(name: String, source: UserDefinedPythonDataSource): Unit = {
val normalizedName = normalize(name)
- if (staticDataSourceBuilders.contains(normalizedName)) {
- // Cannot overwrite static Python Data Sources.
- throw QueryCompilationErrors.dataSourceAlreadyExists(name)
- }
val previousValue = runtimeDataSourceBuilders.put(normalizedName, source)
if (previousValue != null) {
logWarning(log"The data source ${MDC(DATA_SOURCE, name)} replaced a previously " +
log"registered data source.")
+ } else if (staticDataSourceBuilders.contains(normalizedName)) {
+ logWarning(log"The data source ${MDC(DATA_SOURCE, name)} replaced a statically " +
+ log"registered data source.")
}
}
@@ -64,11 +63,7 @@ class DataSourceManager extends Logging {
* it does not exist.
*/
def lookupDataSource(name: String): UserDefinedPythonDataSource = {
- if (dataSourceExists(name)) {
- val normalizedName = normalize(name)
- staticDataSourceBuilders.getOrElse(
- normalizedName, runtimeDataSourceBuilders.get(normalizedName))
- } else {
+ getDataSource(name).getOrElse {
throw QueryCompilationErrors.dataSourceDoesNotExist(name)
}
}
@@ -77,9 +72,14 @@ class DataSourceManager extends Logging {
* Checks if a data source with the specified name exists (case-insensitive).
*/
def dataSourceExists(name: String): Boolean = {
+ getDataSource(name).isDefined
+ }
+
+ private def getDataSource(name: String): Option[UserDefinedPythonDataSource] = {
val normalizedName = normalize(name)
- staticDataSourceBuilders.contains(normalizedName) ||
- runtimeDataSourceBuilders.containsKey(normalizedName)
+ // Runtime registration takes precedence over static.
+ Option(runtimeDataSourceBuilders.get(normalizedName))
+ .orElse(staticDataSourceBuilders.get(normalizedName))
}
override def clone(): DataSourceManager = {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceResolver.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceResolver.scala
index ec8182304f791..3e6dc6255d7f2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceResolver.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceResolver.scala
@@ -26,7 +26,7 @@ import org.apache.spark.sql.catalyst.catalog.UnresolvedCatalogRelation
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.streaming.StreamingRelationV2
import org.apache.spark.sql.classic.SparkSession
-import org.apache.spark.sql.execution.streaming.StreamingRelation
+import org.apache.spark.sql.execution.streaming.runtime.StreamingRelation
/**
* The [[DataSourceResolver]] is a [[Resolver]] extension that resolves nodes defined in the
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceStrategy.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceStrategy.scala
index 3b55a294b21b5..2e47f08ac115a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceStrategy.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceStrategy.scala
@@ -25,7 +25,7 @@ import scala.jdk.CollectionConverters._
import org.apache.hadoop.fs.Path
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.PREDICATES
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.{Row, SaveMode}
@@ -37,6 +37,7 @@ import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
import org.apache.spark.sql.catalyst.planning.PhysicalOperation
+import org.apache.spark.sql.catalyst.plans.{Inner, JoinType, LeftOuter, RightOuter}
import org.apache.spark.sql.catalyst.plans.logical.{AppendData, InsertIntoDir, InsertIntoStatement, LogicalPlan, Project}
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.streaming.StreamingRelationV2
@@ -47,12 +48,13 @@ import org.apache.spark.sql.connector.catalog.{SupportsRead, V1Table}
import org.apache.spark.sql.connector.catalog.TableCapability._
import org.apache.spark.sql.connector.expressions.{Expression => V2Expression, NullOrdering, SortDirection, SortOrder => V2SortOrder, SortValue}
import org.apache.spark.sql.connector.expressions.aggregate.{AggregateFunc, Aggregation}
+import org.apache.spark.sql.connector.join.{JoinType => V2JoinType}
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution
import org.apache.spark.sql.execution.{RowDataSourceScanExec, SparkPlan}
import org.apache.spark.sql.execution.command._
import org.apache.spark.sql.execution.datasources.v2.{DataSourceV2Relation, PushedDownOperators}
-import org.apache.spark.sql.execution.streaming.StreamingRelation
+import org.apache.spark.sql.execution.streaming.runtime.StreamingRelation
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.sources
import org.apache.spark.sql.sources._
@@ -399,7 +401,7 @@ object DataSourceStrategy
l.output.toStructType,
Set.empty,
Set.empty,
- PushedDownOperators(None, None, None, None, Seq.empty, Seq.empty),
+ PushedDownOperators(None, None, None, None, Seq.empty, Seq.empty, Seq.empty, None),
toCatalystRDD(l, baseRelation.buildScan()),
baseRelation,
l.stream,
@@ -474,7 +476,7 @@ object DataSourceStrategy
requestedColumns.toStructType,
pushedFilters.toSet,
handledFilters,
- PushedDownOperators(None, None, None, None, Seq.empty, Seq.empty),
+ PushedDownOperators(None, None, None, None, Seq.empty, Seq.empty, Seq.empty, None),
scanBuilder(requestedColumns, candidatePredicates, pushedFilters),
relation.relation,
relation.stream,
@@ -498,7 +500,7 @@ object DataSourceStrategy
requestedColumns.toStructType,
pushedFilters.toSet,
handledFilters,
- PushedDownOperators(None, None, None, None, Seq.empty, Seq.empty),
+ PushedDownOperators(None, None, None, None, Seq.empty, Seq.empty, Seq.empty, None),
scanBuilder(requestedColumns, candidatePredicates, pushedFilters),
relation.relation,
relation.stream,
@@ -508,6 +510,15 @@ object DataSourceStrategy
}
}
+ def translateJoinType(joinType: JoinType): Option[V2JoinType] = {
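+ // Only join types with a DSv2 counterpart are translated; anything else yields None.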
+ joinType match {
+ case Inner => Some(V2JoinType.INNER_JOIN)
+ case LeftOuter => Some(V2JoinType.LEFT_OUTER_JOIN)
+ case RightOuter => Some(V2JoinType.RIGHT_OUTER_JOIN)
+ case _ => None
+ }
+ }
+
/**
* Convert RDD of Row into RDD of InternalRow with objects in catalyst types
*/
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceUtils.scala
index 3e66b97f61a63..d43c9eab0a5ba 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/DataSourceUtils.scala
@@ -17,6 +17,7 @@
package org.apache.spark.sql.execution.datasources
+import java.io.IOException
import java.util.Locale
import scala.jdk.CollectionConverters._
@@ -127,7 +128,7 @@ object DataSourceUtils extends PredicateHelper {
private def getRebaseSpec(
lookupFileMeta: String => String,
- modeByConfig: LegacyBehaviorPolicy.Value,
+ modeByConfig: String,
minVersion: String,
metadataKey: String): RebaseSpec = {
val policy = if (Utils.isTesting &&
@@ -145,7 +146,7 @@ object DataSourceUtils extends PredicateHelper {
} else {
LegacyBehaviorPolicy.CORRECTED
}
- }.getOrElse(modeByConfig)
+ }.getOrElse(LegacyBehaviorPolicy.withName(modeByConfig))
}
policy match {
case LegacyBehaviorPolicy.LEGACY =>
@@ -156,7 +157,7 @@ object DataSourceUtils extends PredicateHelper {
def datetimeRebaseSpec(
lookupFileMeta: String => String,
- modeByConfig: LegacyBehaviorPolicy.Value): RebaseSpec = {
+ modeByConfig: String): RebaseSpec = {
getRebaseSpec(
lookupFileMeta,
modeByConfig,
@@ -166,7 +167,7 @@ object DataSourceUtils extends PredicateHelper {
def int96RebaseSpec(
lookupFileMeta: String => String,
- modeByConfig: LegacyBehaviorPolicy.Value): RebaseSpec = {
+ modeByConfig: String): RebaseSpec = {
getRebaseSpec(
lookupFileMeta,
modeByConfig,
@@ -197,6 +198,11 @@ object DataSourceUtils extends PredicateHelper {
QueryExecutionErrors.sparkUpgradeInWritingDatesError(format, config)
}
+ def shouldIgnoreCorruptFileException(e: Throwable): Boolean = e match {
+ case _: RuntimeException | _: IOException | _: InternalError => true
+ case _ => false
+ }
+
def createDateRebaseFuncInRead(
rebaseMode: LegacyBehaviorPolicy.Value,
format: String): Int => Int = rebaseMode match {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormat.scala
index d3078740b819c..8a254b464da71 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormat.scala
@@ -29,7 +29,7 @@ import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.codegen.GenerateUnsafeProjection
import org.apache.spark.sql.catalyst.types.DataTypeUtils.toAttributes
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.internal.SQLConf
+import org.apache.spark.sql.internal.{SessionStateHelper, SQLConf}
import org.apache.spark.sql.sources.Filter
import org.apache.spark.sql.types._
@@ -356,7 +356,7 @@ object FileFormat {
/**
* The base class file format that is based on text file.
*/
-abstract class TextBasedFileFormat extends FileFormat {
+abstract class TextBasedFileFormat extends FileFormat with SessionStateHelper {
private var codecFactory: CompressionCodecFactory = _
override def isSplitable(
@@ -364,8 +364,7 @@ abstract class TextBasedFileFormat extends FileFormat {
options: Map[String, String],
path: Path): Boolean = {
if (codecFactory == null) {
- codecFactory = new CompressionCodecFactory(
- sparkSession.sessionState.newHadoopConfWithOptions(options))
+ codecFactory = new CompressionCodecFactory(getHadoopConf(sparkSession, options))
}
val codec = codecFactory.getCodec(path)
codec == null || codec.isInstanceOf[SplittableCompressionCodec]
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatDataWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatDataWriter.scala
index 7d071124b0b30..e11c2b15e0541 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatDataWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatDataWriter.scala
@@ -22,7 +22,7 @@ import org.apache.hadoop.fs.{FileAlreadyExistsException, Path}
import org.apache.hadoop.mapreduce.TaskAttemptContext
import org.apache.spark.TaskOutputFileAlreadyExistException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CONFIG, NUM_CONCURRENT_WRITER}
import org.apache.spark.internal.io.{FileCommitProtocol, FileNameSpec}
import org.apache.spark.internal.io.FileCommitProtocol.TaskCommitMessage
@@ -172,7 +172,7 @@ class SingleDirectoryDataWriter(
val currentPath = committer.newTaskTempFile(
taskAttemptContext,
None,
- f"-c$fileCounter%03d" + ext)
+ FileNameSpec("", f"-c$fileCounter%03d" + ext))
currentWriter = description.outputWriterFactory.newInstance(
path = currentPath,
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatWriter.scala
index b4cffa59c98d5..55e2271dc058b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileFormatWriter.scala
@@ -26,7 +26,7 @@ import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat
import org.apache.hadoop.mapreduce.task.TaskAttemptContextImpl
import org.apache.spark._
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.LogKeys._
import org.apache.spark.internal.io.{FileCommitProtocol, SparkHadoopWriterUtils}
import org.apache.spark.sql.catalyst.InternalRow
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FilePartition.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FilePartition.scala
index 50af845c37cb1..68a9bbfc7ab1d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FilePartition.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FilePartition.scala
@@ -21,7 +21,7 @@ import scala.collection.mutable.ArrayBuffer
import scala.math.BigDecimal.RoundingMode
import org.apache.spark.Partition
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CONFIG, DESIRED_NUM_PARTITIONS, MAX_NUM_PARTITIONS, NUM_PARTITIONS}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.classic.ClassicConversions._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileScanRDD.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileScanRDD.scala
index e468807f4ffd1..5dc13ccee9ce0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileScanRDD.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileScanRDD.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.execution.datasources
-import java.io.{Closeable, FileNotFoundException, IOException}
+import java.io.{Closeable, FileNotFoundException}
import java.net.URI
import org.apache.hadoop.fs.Path
@@ -27,7 +27,6 @@ import org.apache.hadoop.security.AccessControlException
import org.apache.spark.{Partition => RDDPartition, TaskContext}
import org.apache.spark.deploy.SparkHadoopUtil
import org.apache.spark.internal.LogKeys.{CURRENT_FILE, PATH}
-import org.apache.spark.internal.MDC
import org.apache.spark.paths.SparkPath
import org.apache.spark.rdd.{InputFileBlockHolder, RDD}
import org.apache.spark.sql.SparkSession
@@ -269,7 +268,8 @@ class FileScanRDD(
// Throw FileNotFoundException even if `ignoreCorruptFiles` is true
case e: FileNotFoundException if !ignoreMissingFiles => throw e
case e @ (_ : AccessControlException | _ : BlockMissingException) => throw e
- case e @ (_: RuntimeException | _: IOException) if ignoreCorruptFiles =>
+ case e if ignoreCorruptFiles &&
+ DataSourceUtils.shouldIgnoreCorruptFileException(e) =>
logWarning(log"Skipped the rest of the content in the corrupted file: " +
log"${MDC(PATH, currentFile)}", e)
finished = true
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileSourceStrategy.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileSourceStrategy.scala
index 7291da248294a..396375890c249 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileSourceStrategy.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileSourceStrategy.scala
@@ -21,7 +21,7 @@ import java.util.Locale
import scala.collection.mutable
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{NUM_PRUNED, POST_SCAN_FILTERS, PUSHED_FILTERS, TOTAL}
import org.apache.spark.sql._
import org.apache.spark.sql.catalyst.catalog.BucketSpec
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileStatusCache.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileStatusCache.scala
index 2bb8476a9f0e8..cf182ec18f1c9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileStatusCache.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/FileStatusCache.scala
@@ -25,7 +25,7 @@ import scala.jdk.CollectionConverters._
import com.google.common.cache._
import org.apache.hadoop.fs.{FileStatus, Path}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CACHED_TABLE_PARTITION_METADATA_SIZE, MAX_TABLE_PARTITION_METADATA_SIZE}
import org.apache.spark.sql.SparkSession
import org.apache.spark.util.SizeEstimator
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/HadoopFileLinesReader.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/HadoopFileLinesReader.scala
index bf6da8765e516..be13dc340f48d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/HadoopFileLinesReader.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/HadoopFileLinesReader.scala
@@ -25,6 +25,7 @@ import org.apache.hadoop.mapreduce._
import org.apache.hadoop.mapreduce.lib.input.{FileSplit, LineRecordReader}
import org.apache.hadoop.mapreduce.task.TaskAttemptContextImpl
+import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.Utils
/**
@@ -57,10 +58,13 @@ class HadoopFileLinesReader(
val hadoopAttemptContext = new TaskAttemptContextImpl(conf, attemptId)
Utils.tryInitializeResource(
- lineSeparator match {
- case Some(sep) => new LineRecordReader(sep)
- // If the line separator is `None`, it covers `\r`, `\r\n` and `\n`.
- case _ => new LineRecordReader()
+ // HadoopLineRecordReader is LineRecordReader with some changes, such as support for
+ // specifying the compression codec instead of always inferring it from the file extension.
+ // If the line separator is `None`, it covers `\r`, `\r\n` and `\n`.
+ if (SQLConf.get.hadoopLineRecordReaderEnabled) {
+ new HadoopLineRecordReader(lineSeparator.orNull)
+ } else {
+ new LineRecordReader(lineSeparator.orNull)
}
) { reader =>
reader.initialize(fileSplit, hadoopAttemptContext)
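
The reader construction above still goes through Utils.tryInitializeResource, which closes the freshly created reader if its initialization step fails. Below is a self-contained sketch of that acquire/initialize/close-on-failure idiom, assuming only java.io.Closeable; it illustrates the pattern and is not Spark's implementation.

import java.io.Closeable

object ResourceInit {
  // Create a Closeable resource, run an initialization step, and close the resource if
  // initialization throws, so a half-initialized resource is never leaked.
  def tryInitializeResource[R <: Closeable, T](createResource: => R)(initialize: R => T): T = {
    val resource = createResource
    try {
      initialize(resource)
    } catch {
      case e: Throwable =>
        resource.close()
        throw e
    }
  }
}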
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/InMemoryFileIndex.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/InMemoryFileIndex.scala
index 3b8a20c7cf741..2d68faa3ff526 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/InMemoryFileIndex.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/InMemoryFileIndex.scala
@@ -24,13 +24,13 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs._
import org.apache.hadoop.mapred.{FileInputFormat, JobConf}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{COUNT, ELAPSED_TIME}
import org.apache.spark.metrics.source.HiveCatalogMetrics
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.FileSourceOptions
import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
-import org.apache.spark.sql.execution.streaming.FileStreamSink
+import org.apache.spark.sql.execution.streaming.sinks.FileStreamSink
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.HadoopFSUtils
@@ -103,7 +103,8 @@ class InMemoryFileIndex(
}
override def equals(other: Any): Boolean = other match {
- case hdfs: InMemoryFileIndex => rootPaths.toSet == hdfs.rootPaths.toSet
+ case hdfs: InMemoryFileIndex if rootPaths.size == hdfs.rootPaths.size =>
+ rootPaths.sorted == hdfs.rootPaths.sorted
case _ => false
}
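
The equals change above swaps the toSet comparison for a size guard plus a sorted comparison. A small standalone sketch of the behavioral difference on duplicate root paths; plain strings stand in for the Hadoop Paths that InMemoryFileIndex actually compares.

object RootPathEquality {
  def equalAsSets(a: Seq[String], b: Seq[String]): Boolean = a.toSet == b.toSet

  def equalSorted(a: Seq[String], b: Seq[String]): Boolean =
    a.size == b.size && a.sorted == b.sorted

  def main(args: Array[String]): Unit = {
    val x = Seq("/data/a", "/data/a", "/data/b")
    val y = Seq("/data/a", "/data/b")
    println(equalAsSets(x, y)) // true: toSet collapses the duplicate entry
    println(equalSorted(x, y)) // false: the size guard rejects the duplicate-only difference
  }
}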
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/PartitioningAwareFileIndex.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/PartitioningAwareFileIndex.scala
index 07be3f89872cc..1bf0d2f0301f2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/PartitioningAwareFileIndex.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/PartitioningAwareFileIndex.scala
@@ -24,7 +24,7 @@ import scala.collection.mutable
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs._
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{COUNT, PERCENT, TOTAL}
import org.apache.spark.paths.SparkPath
import org.apache.spark.sql.SparkSession
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/SQLHadoopMapReduceCommitProtocol.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/SQLHadoopMapReduceCommitProtocol.scala
index 03e988eb0bd2b..db9a65a3814db 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/SQLHadoopMapReduceCommitProtocol.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/SQLHadoopMapReduceCommitProtocol.scala
@@ -21,7 +21,7 @@ import org.apache.hadoop.fs.Path
import org.apache.hadoop.mapreduce.{OutputCommitter, TaskAttemptContext}
import org.apache.hadoop.mapreduce.lib.output.FileOutputCommitter
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.CLASS_NAME
import org.apache.spark.internal.io.HadoopMapReduceCommitProtocol
import org.apache.spark.sql.internal.SQLConf
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/binaryfile/BinaryFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/binaryfile/BinaryFileFormat.scala
index a1f2e16449244..57e0efb993fb7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/binaryfile/BinaryFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/binaryfile/BinaryFileFormat.scala
@@ -19,7 +19,7 @@ package org.apache.spark.sql.execution.datasources.binaryfile
import java.sql.Timestamp
-import com.google.common.io.{ByteStreams, Closeables}
+import com.google.common.io.Closeables
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileStatus, Path}
import org.apache.hadoop.mapreduce.Job
@@ -31,6 +31,7 @@ import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.catalyst.util.DateTimeUtils
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.datasources.{FileFormat, OutputWriterFactory, PartitionedFile}
+import org.apache.spark.sql.internal.SessionStateHelper
import org.apache.spark.sql.internal.SQLConf.SOURCES_BINARY_FILE_MAX_LENGTH
import org.apache.spark.sql.sources.{And, DataSourceRegister, EqualTo, Filter, GreaterThan, GreaterThanOrEqual, LessThan, LessThanOrEqual, Not, Or}
import org.apache.spark.sql.types._
@@ -55,7 +56,8 @@ import org.apache.spark.util.SerializableConfiguration
* .load("/path/to/fileDir");
* }}}
*/
-case class BinaryFileFormat() extends FileFormat with DataSourceRegister {
+case class BinaryFileFormat() extends FileFormat
+ with DataSourceRegister with SessionStateHelper {
import BinaryFileFormat._
@@ -98,7 +100,7 @@ case class BinaryFileFormat() extends FileFormat with DataSourceRegister {
val broadcastedHadoopConf =
SerializableConfiguration.broadcast(sparkSession.sparkContext, hadoopConf)
val filterFuncs = filters.flatMap(filter => createFilterFunction(filter))
- val maxLength = sparkSession.sessionState.conf.getConf(SOURCES_BINARY_FILE_MAX_LENGTH)
+ val maxLength = getSqlConf(sparkSession).getConf(SOURCES_BINARY_FILE_MAX_LENGTH)
file: PartitionedFile => {
val path = file.toPath
@@ -118,7 +120,7 @@ case class BinaryFileFormat() extends FileFormat with DataSourceRegister {
}
val stream = fs.open(status.getPath)
try {
- writer.write(i, ByteStreams.toByteArray(stream))
+ writer.write(i, stream.readAllBytes())
} finally {
Closeables.close(stream, true)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVDataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVDataSource.scala
index c6b9764bee2c9..596edc8beaa34 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVDataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVDataSource.scala
@@ -30,7 +30,7 @@ import org.apache.hadoop.mapreduce.lib.input.FileInputFormat
import org.apache.spark.TaskContext
import org.apache.spark.input.{PortableDataStream, StreamInputFormat}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.PATH
import org.apache.spark.paths.SparkPath
import org.apache.spark.rdd.{BinaryFileRDD, RDD}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVFileFormat.scala
index 8aaeae3ae952f..bf189268b4d6a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/csv/CSVFileFormat.scala
@@ -43,23 +43,15 @@ case class CSVFileFormat() extends TextBasedFileFormat with DataSourceRegister {
sparkSession: SparkSession,
options: Map[String, String],
path: Path): Boolean = {
- val parsedOptions = new CSVOptions(
- options,
- columnPruning = sparkSession.sessionState.conf.csvColumnPruning,
- sparkSession.sessionState.conf.sessionLocalTimeZone)
- val csvDataSource = CSVDataSource(parsedOptions)
- csvDataSource.isSplitable && super.isSplitable(sparkSession, options, path)
+ val parsedOptions = getCsvOptions(sparkSession, options)
+ CSVDataSource(parsedOptions).isSplitable && super.isSplitable(sparkSession, options, path)
}
override def inferSchema(
sparkSession: SparkSession,
options: Map[String, String],
files: Seq[FileStatus]): Option[StructType] = {
- val parsedOptions = new CSVOptions(
- options,
- columnPruning = sparkSession.sessionState.conf.csvColumnPruning,
- sparkSession.sessionState.conf.sessionLocalTimeZone)
-
+ val parsedOptions = getCsvOptions(sparkSession, options)
CSVDataSource(parsedOptions).inferSchema(sparkSession, files, parsedOptions)
}
@@ -76,13 +68,9 @@ case class CSVFileFormat() extends TextBasedFileFormat with DataSourceRegister {
throw QueryCompilationErrors.dataTypeUnsupportedByDataSourceError("CSV", field)
}
}
- val conf = job.getConfiguration
- val csvOptions = new CSVOptions(
- options,
- columnPruning = sparkSession.sessionState.conf.csvColumnPruning,
- sparkSession.sessionState.conf.sessionLocalTimeZone)
- csvOptions.compressionCodec.foreach { codec =>
- CompressionCodecs.setCodecConfiguration(conf, codec)
+ val parsedOptions = getCsvOptions(sparkSession, options)
+ parsedOptions.compressionCodec.foreach { codec =>
+ CompressionCodecs.setCodecConfiguration(job.getConfiguration, codec)
}
new OutputWriterFactory {
@@ -90,11 +78,11 @@ case class CSVFileFormat() extends TextBasedFileFormat with DataSourceRegister {
path: String,
dataSchema: StructType,
context: TaskAttemptContext): OutputWriter = {
- new CsvOutputWriter(path, dataSchema, context, csvOptions)
+ new CsvOutputWriter(path, dataSchema, context, parsedOptions)
}
override def getFileExtension(context: TaskAttemptContext): String = {
- "." + csvOptions.extension + CodecStreams.getCompressionExtension(context)
+ "." + parsedOptions.extension + CodecStreams.getCompressionExtension(context)
}
}
}
@@ -109,11 +97,7 @@ case class CSVFileFormat() extends TextBasedFileFormat with DataSourceRegister {
hadoopConf: Configuration): (PartitionedFile) => Iterator[InternalRow] = {
val broadcastedHadoopConf =
SerializableConfiguration.broadcast(sparkSession.sparkContext, hadoopConf)
- val parsedOptions = new CSVOptions(
- options,
- sparkSession.sessionState.conf.csvColumnPruning,
- sparkSession.sessionState.conf.sessionLocalTimeZone,
- sparkSession.sessionState.conf.columnNameOfCorruptRecord)
+ val parsedOptions = getCsvOptions(sparkSession, options)
val isColumnPruningEnabled = parsedOptions.isColumnPruningEnabled(requiredSchema)
// Check a field requirement for corrupt records here to throw an exception in a driver side
@@ -180,4 +164,15 @@ case class CSVFileFormat() extends TextBasedFileFormat with DataSourceRegister {
}
override def allowDuplicatedColumnNames: Boolean = true
+
+ private def getCsvOptions(
+ sparkSession: SparkSession,
+ options: Map[String, String]): CSVOptions = {
+ val conf = getSqlConf(sparkSession)
+ new CSVOptions(
+ options,
+ conf.csvColumnPruning,
+ conf.sessionLocalTimeZone,
+ conf.columnNameOfCorruptRecord)
+ }
}
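
The hunks above collapse four separately built CSVOptions into a single getCsvOptions helper driven by the session conf, so the read, write and schema-inference paths cannot drift apart. A small sketch of the same build-options-once pattern; SessionConf and ParsedCsvOptions are hypothetical stand-ins for SQLConf and CSVOptions.

final case class SessionConf(
    csvColumnPruning: Boolean,
    sessionLocalTimeZone: String,
    columnNameOfCorruptRecord: String)

final case class ParsedCsvOptions(
    userOptions: Map[String, String],
    columnPruning: Boolean,
    timeZoneId: String,
    corruptRecordColumn: String)

object CsvOptionsFactory {
  // Every conf-derived argument is read in one place and the user-supplied options are
  // threaded through unchanged.
  def getCsvOptions(conf: SessionConf, options: Map[String, String]): ParsedCsvOptions =
    ParsedCsvOptions(
      userOptions = options,
      columnPruning = conf.csvColumnPruning,
      timeZoneId = conf.sessionLocalTimeZone,
      corruptRecordColumn = conf.columnNameOfCorruptRecord)
}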
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCDatabaseMetadata.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCDatabaseMetadata.scala
new file mode 100644
index 0000000000000..7aa184f57fc00
--- /dev/null
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCDatabaseMetadata.scala
@@ -0,0 +1,102 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution.datasources.jdbc
+
+import java.sql.Connection
+
+import scala.util.control.NonFatal
+
+import org.apache.spark.internal.Logging
+
+/**
+ * Object that contains metadata about the external database.
+ * The metadata is static database information such as the database version and the
+ * version of the JDBC driver.
+ *
+ * This object is stored in JDBCRDD.
+ */
+case class JDBCDatabaseMetadata(
+ databaseMajorVersion: Option[Int],
+ databaseMinorVersion: Option[Int],
+ databaseDriverMajorVersion: Option[Int],
+ databaseDriverMinorVersion: Option[Int]
+ )
+
+/**
+ * Companion object for JDBCDatabaseMetadata.
+ * Contains factory methods to build instances.
+ */
+object JDBCDatabaseMetadata extends Logging {
+
+ /**
+ * Safely retrieves a piece of metadata.
+ *
+ * @param f A function that retrieves an integer value from DatabaseMetaData.
+ * @return Some(value) on success, None on failure.
+ */
+ private def safeGet(f: => Int): Option[Int] = {
+ try {
+ Some(f)
+ } catch {
+ case NonFatal(e) =>
+ logWarning(log"Exception while getting specific database metadata", e)
+ None
+ }
+ }
+
+ /**
+ * Creates a JDBCDatabaseMetadata instance from a JDBC Connection,
+ * handling errors for each field individually.
+ *
+ * @param getConnection A JDBC connection factory.
+ * @return A new instance of JDBCDatabaseMetadata containing the version metadata.
+ */
+ def fromJDBCConnectionFactory(getConnection: Int => Connection): JDBCDatabaseMetadata = {
+ var conn: Connection = null
+
+ def closeConnection(): Unit = {
+ try {
+ if (null != conn) {
+ conn.close()
+ }
+ logInfo("closed connection during metadata fetch")
+ } catch {
+ case e: Exception => logWarning("Exception closing connection during metadata fetch", e)
+ }
+ }
+
+ try {
+ conn = getConnection(-1)
+ // getMetaData itself can throw, so we catch that and return None for all fields
+ val databaseMetadata = conn.getMetaData
+
+ JDBCDatabaseMetadata(
+ databaseMajorVersion = safeGet(databaseMetadata.getDatabaseMajorVersion),
+ databaseMinorVersion = safeGet(databaseMetadata.getDatabaseMinorVersion),
+ databaseDriverMajorVersion = safeGet(databaseMetadata.getDriverMajorVersion),
+ databaseDriverMinorVersion = safeGet(databaseMetadata.getDriverMinorVersion)
+ )
+ } catch {
+ case NonFatal(e) =>
+ logWarning(log"Exception while getting database metadata object from connection", e)
+ JDBCDatabaseMetadata(None, None, None, None)
+ } finally {
+ closeConnection()
+ }
+ }
+}
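
JDBCDatabaseMetadata wraps every metadata getter in safeGet so that one misbehaving driver call degrades a single field to None instead of failing the whole lookup. A standalone sketch of the same per-field pattern; DriverInfo and describeDriver are hypothetical names used only for this illustration.

import java.sql.Connection

import scala.util.control.NonFatal

final case class DriverInfo(driverMajor: Option[Int], driverMinor: Option[Int])

object DriverInfo {
  // Each getter is wrapped individually; a failure in one field does not affect the others.
  private def safeGet(f: => Int): Option[Int] =
    try Some(f) catch { case NonFatal(_) => None }

  def describeDriver(conn: Connection): DriverInfo = {
    try {
      val md = conn.getMetaData
      DriverInfo(safeGet(md.getDriverMajorVersion), safeGet(md.getDriverMinorVersion))
    } catch {
      case NonFatal(_) => DriverInfo(None, None) // getMetaData itself may throw
    }
  }
}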
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCOptions.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCOptions.scala
index f0c638b7d07c8..3c85b6e65dee7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCOptions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCOptions.scala
@@ -100,7 +100,7 @@ class JDBCOptions(
if (subquery.isEmpty) {
throw QueryExecutionErrors.emptyOptionError(JDBC_QUERY_STRING)
} else {
- s"(${subquery}) SPARK_GEN_SUBQ_${curId.getAndIncrement()}"
+ s"(${subquery.trim.replaceAll(";+$", "")}) SPARK_GEN_SUBQ_${curId.getAndIncrement()}"
}
}
@@ -215,6 +215,10 @@ class JDBCOptions(
// This only applies to Data Source V2 JDBC
val pushDownTableSample = parameters.getOrElse(JDBC_PUSHDOWN_TABLESAMPLE, "true").toBoolean
+ // An option to allow/disallow pushing down JOIN into the JDBC data source
+ // This only applies to Data Source V2 JDBC
+ val pushDownJoin = parameters.getOrElse(JDBC_PUSHDOWN_JOIN, "true").toBoolean
+
// The local path of user's keytab file, which is assumed to be pre-uploaded to all nodes either
// by --files option of spark-submit or manually
val keytab = {
@@ -321,6 +325,7 @@ object JDBCOptions {
val JDBC_PUSHDOWN_LIMIT = newOption("pushDownLimit")
val JDBC_PUSHDOWN_OFFSET = newOption("pushDownOffset")
val JDBC_PUSHDOWN_TABLESAMPLE = newOption("pushDownTableSample")
+ val JDBC_PUSHDOWN_JOIN = newOption("pushDownJoin")
val JDBC_KEYTAB = newOption("keytab")
val JDBC_PRINCIPAL = newOption("principal")
val JDBC_TABLE_COMMENT = newOption("tableComment")
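
The new pushDownJoin option defaults to true and, like pushDownTableSample, only applies to the Data Source V2 JDBC path. A hedged usage sketch for disabling it on a single scan; the URL, table name and master are placeholders.

import org.apache.spark.sql.SparkSession

object PushDownJoinExample {
  def main(args: Array[String]): Unit = {
    val spark = SparkSession.builder()
      .appName("pushDownJoin-example")
      .master("local[*]")
      .getOrCreate()

    val ordersDf = spark.read
      .format("jdbc")
      .option("url", "jdbc:postgresql://localhost:5432/shop") // placeholder connection
      .option("dbtable", "orders")                            // placeholder table
      .option("pushDownJoin", "false")                        // opt out of JOIN pushdown
      .load()

    ordersDf.printSchema()
    spark.stop()
  }
}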
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRDD.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRDD.scala
index 8342ae06da01a..33cb5342fd3d1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRDD.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRDD.scala
@@ -23,7 +23,7 @@ import scala.util.Using
import scala.util.control.NonFatal
import org.apache.spark.{InterruptibleIterator, Partition, SparkContext, SparkException, TaskContext}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.SQL_TEXT
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
@@ -54,7 +54,7 @@ object JDBCRDD extends Logging {
* @throws java.sql.SQLException if the table specification is garbage.
* @throws java.sql.SQLException if the table contains an unsupported type.
*/
- def resolveTable(options: JDBCOptions): StructType = {
+ def resolveTable(options: JDBCOptions, conn: Connection): StructType = {
val url = options.url
val prepareQuery = options.prepareQuery
val table = options.tableOrQuery
@@ -62,7 +62,7 @@ object JDBCRDD extends Logging {
val fullQuery = prepareQuery + dialect.getSchemaQuery(table)
try {
- getQueryOutputSchema(fullQuery, options, dialect)
+ getQueryOutputSchema(fullQuery, options, dialect, conn)
} catch {
case e: SQLException if dialect.isSyntaxErrorBestEffort(e) =>
throw new SparkException(
@@ -72,19 +72,31 @@ object JDBCRDD extends Logging {
}
}
+ def resolveTable(options: JDBCOptions): StructType = {
+ JdbcUtils.withConnection(options) {
+ resolveTable(options, _)
+ }
+ }
+
def getQueryOutputSchema(
- query: String, options: JDBCOptions, dialect: JdbcDialect): StructType = {
- Using.resource(dialect.createConnectionFactory(options)(-1)) { conn =>
- Using.resource(conn.prepareStatement(query)) { statement =>
- statement.setQueryTimeout(options.queryTimeout)
- Using.resource(statement.executeQuery()) { rs =>
- JdbcUtils.getSchema(conn, rs, dialect, alwaysNullable = true,
- isTimestampNTZ = options.preferTimestampNTZ)
- }
+ query: String, options: JDBCOptions, dialect: JdbcDialect, conn: Connection): StructType = {
+ logInfo(log"Generated JDBC query to get scan output schema: ${MDC(SQL_TEXT, query)}")
+ Using.resource(conn.prepareStatement(query)) { statement =>
+ statement.setQueryTimeout(options.queryTimeout)
+ Using.resource(statement.executeQuery()) { rs =>
+ JdbcUtils.getSchema(conn, rs, dialect, alwaysNullable = true,
+ isTimestampNTZ = options.preferTimestampNTZ)
}
}
}
+ def getQueryOutputSchema(
+ query: String, options: JDBCOptions, dialect: JdbcDialect): StructType = {
+ JdbcUtils.withConnection(options) {
+ getQueryOutputSchema(query, options, dialect, _)
+ }
+ }
+
/**
* Prune all but the specified columns from the specified Catalyst schema.
*
@@ -130,7 +142,8 @@ object JDBCRDD extends Logging {
sample: Option[TableSampleInfo] = None,
limit: Int = 0,
sortOrders: Array[String] = Array.empty[String],
- offset: Int = 0): RDD[InternalRow] = {
+ offset: Int = 0,
+ additionalMetrics: Map[String, SQLMetric] = Map()): RDD[InternalRow] = {
val url = options.url
val dialect = JdbcDialects.get(url)
val quotedColumns = if (groupByColumns.isEmpty) {
@@ -139,20 +152,24 @@ object JDBCRDD extends Logging {
// these are already quoted in JDBCScanBuilder
requiredColumns
}
+ val connectionFactory = dialect.createConnectionFactory(options)
+
new JDBCRDD(
sc,
- dialect.createConnectionFactory(options),
+ connectionFactory,
outputSchema.getOrElse(pruneSchema(schema, requiredColumns)),
quotedColumns,
predicates,
parts,
url,
options,
+ databaseMetadata = JDBCDatabaseMetadata.fromJDBCConnectionFactory(connectionFactory),
groupByColumns,
sample,
limit,
sortOrders,
- offset)
+ offset,
+ additionalMetrics)
}
// scalastyle:on argcount
}
@@ -171,11 +188,13 @@ class JDBCRDD(
partitions: Array[Partition],
url: String,
options: JDBCOptions,
+ databaseMetadata: JDBCDatabaseMetadata,
groupByColumns: Option[Array[String]],
sample: Option[TableSampleInfo],
limit: Int,
sortOrders: Array[String],
- offset: Int)
+ offset: Int,
+ additionalMetrics: Map[String, SQLMetric])
extends RDD[InternalRow](sc, Nil) with DataSourceMetricsMixin with ExternalEngineDatasourceRDD {
/**
@@ -185,6 +204,17 @@ class JDBCRDD(
sparkContext,
name = "JDBC query execution time")
+ /**
+ * Time needed to fetch the data and transform it into Spark's InternalRow format.
+ *
+ * Usually this time is spent on network transfer, but it can also be spent on transformation
+ * when converting more complex datatypes such as structs.
+ */
+ val fetchAndTransformToInternalRowsMetric: SQLMetric = SQLMetrics.createNanoTimingMetric(
+ sparkContext,
+ // The message the user sees does not need to leak details about the conversion
+ name = "JDBC remote data fetch and translation time")
+
private lazy val dialect = JdbcDialects.get(url)
def generateJdbcQuery(partition: Option[JDBCPartition]): String = {
@@ -219,6 +249,11 @@ class JDBCRDD(
generateJdbcQuery(partition = None)
}
+ /**
+ * Get the external engine database metadata.
+ */
+ def getDatabaseMetadata: JDBCDatabaseMetadata = databaseMetadata
+
/**
* Runs the SQL query against the JDBC driver.
*/
@@ -287,28 +322,31 @@ class JDBCRDD(
}
val sqlText = generateJdbcQuery(Some(part))
+ logInfo(log"Generated JDBC query to fetch data: ${MDC(SQL_TEXT, sqlText)}")
stmt = conn.prepareStatement(sqlText,
ResultSet.TYPE_FORWARD_ONLY, ResultSet.CONCUR_READ_ONLY)
stmt.setFetchSize(options.fetchSize)
stmt.setQueryTimeout(options.queryTimeout)
- val startTime = System.nanoTime
- rs = try {
- stmt.executeQuery()
- } catch {
- case e: SQLException if dialect.isSyntaxErrorBestEffort(e) =>
- throw new SparkException(
- errorClass = "JDBC_EXTERNAL_ENGINE_SYNTAX_ERROR.DURING_QUERY_EXECUTION",
- messageParameters = Map("jdbcQuery" -> sqlText),
- cause = e)
+ rs = SQLMetrics.withTimingNs(queryExecutionTimeMetric) {
+ try {
+ stmt.executeQuery()
+ } catch {
+ case e: SQLException if dialect.isSyntaxErrorBestEffort(e) =>
+ throw new SparkException(
+ errorClass = "JDBC_EXTERNAL_ENGINE_SYNTAX_ERROR.DURING_QUERY_EXECUTION",
+ messageParameters = Map("jdbcQuery" -> sqlText),
+ cause = e)
+ }
}
- val endTime = System.nanoTime
-
- val executionTime = endTime - startTime
- queryExecutionTimeMetric.add(executionTime)
val rowsIterator =
- JdbcUtils.resultSetToSparkInternalRows(rs, dialect, schema, inputMetrics)
+ JdbcUtils.resultSetToSparkInternalRows(
+ rs,
+ dialect,
+ schema,
+ inputMetrics,
+ Some(fetchAndTransformToInternalRowsMetric))
CompletionIterator[InternalRow, Iterator[InternalRow]](
new InterruptibleIterator(context, rowsIterator), close())
@@ -316,7 +354,8 @@ class JDBCRDD(
override def getMetrics: Seq[(String, SQLMetric)] = {
Seq(
+ "fetchAndTransformToInternalRowsNs" -> fetchAndTransformToInternalRowsMetric,
"queryExecutionTime" -> queryExecutionTimeMetric
- )
+ ) ++ additionalMetrics
}
}
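
The hunk above replaces the manual startTime/endTime bookkeeping around executeQuery with SQLMetrics.withTimingNs. A standalone sketch of that run-block-and-accumulate-nanoseconds pattern, using a LongAdder as a stand-in for SQLMetric; this illustrates the idiom and is not Spark's implementation.

import java.util.concurrent.atomic.LongAdder

object Timing {
  // Run the block, add the elapsed nanoseconds to the accumulator, and return the result.
  def withTimingNs[T](metric: LongAdder)(body: => T): T = {
    val start = System.nanoTime()
    try {
      body
    } finally {
      metric.add(System.nanoTime() - start) // in this sketch, recorded even if body throws
    }
  }
}

object TimingExample {
  def main(args: Array[String]): Unit = {
    val queryExecutionTimeNs = new LongAdder
    val result = Timing.withTimingNs(queryExecutionTimeNs) {
      Thread.sleep(5) // stand-in for stmt.executeQuery()
      42
    }
    println(s"result=$result, elapsedNs=${queryExecutionTimeNs.sum()}")
  }
}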
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRelation.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRelation.scala
index 2c4158dfe1533..05e30207314a7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRelation.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JDBCRelation.scala
@@ -21,7 +21,7 @@ import scala.collection.mutable.ArrayBuffer
import scala.math.BigDecimal.RoundingMode
import org.apache.spark.Partition
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CLAUSES, LOWER_BOUND, NEW_VALUE, NUM_PARTITIONS, OLD_VALUE, UPPER_BOUND}
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.{DataFrame, Row, SaveMode, SparkSession, SQLContext}
@@ -31,6 +31,7 @@ import org.apache.spark.sql.catalyst.util.DateTimeUtils.{getZoneId, stringToDate
import org.apache.spark.sql.connector.expressions.filter.Predicate
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.datasources.v2.TableSampleInfo
+import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.jdbc.JdbcDialects
import org.apache.spark.sql.sources._
@@ -48,6 +49,9 @@ private[sql] case class JDBCPartitioningInfo(
numPartitions: Int)
private[sql] object JDBCRelation extends Logging {
+
+ val schemaFetchName = "Remote JDBC schema fetch time"
+ val schemaFetchKey = "remoteSchemaFetchTime"
/**
* Given a partitioning schematic (a column of integral type, a number of
* partitions, and upper and lower bounds on the column's value), generate
@@ -255,15 +259,20 @@ private[sql] object JDBCRelation extends Logging {
parts: Array[Partition],
jdbcOptions: JDBCOptions)(
sparkSession: SparkSession): JDBCRelation = {
- val schema = JDBCRelation.getSchema(sparkSession.sessionState.conf.resolver, jdbcOptions)
- JDBCRelation(schema, parts, jdbcOptions)(sparkSession)
+ val remoteSchemaFetchMetric = JdbcUtils.createSchemaFetchMetric(sparkSession.sparkContext)
+ val schema = SQLMetrics.withTimingNs(remoteSchemaFetchMetric) {
+ JDBCRelation.getSchema(sparkSession.sessionState.conf.resolver, jdbcOptions)
+ }
+ JDBCRelation(schema, parts, jdbcOptions,
+ Map(schemaFetchKey -> remoteSchemaFetchMetric))(sparkSession)
}
}
private[sql] case class JDBCRelation(
override val schema: StructType,
parts: Array[Partition],
- jdbcOptions: JDBCOptions)(@transient val sparkSession: SparkSession)
+ jdbcOptions: JDBCOptions,
+ additionalMetrics: Map[String, SQLMetric] = Map())(@transient val sparkSession: SparkSession)
extends BaseRelation
with PrunedFilteredScan
with InsertableRelation {
@@ -296,7 +305,8 @@ private[sql] case class JDBCRelation(
requiredColumns,
pushedPredicates,
parts,
- jdbcOptions).asInstanceOf[RDD[Row]]
+ jdbcOptions,
+ additionalMetrics = additionalMetrics).asInstanceOf[RDD[Row]]
}
def buildScan(
@@ -321,7 +331,8 @@ private[sql] case class JDBCRelation(
tableSample,
limit,
sortOrders,
- offset).asInstanceOf[RDD[Row]]
+ offset,
+ additionalMetrics).asInstanceOf[RDD[Row]]
}
override def insert(data: DataFrame, overwrite: Boolean): Unit = {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcRelationProvider.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcRelationProvider.scala
index d9be1a1e3f674..6b9d0520f2eb5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcRelationProvider.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcRelationProvider.scala
@@ -20,6 +20,7 @@ package org.apache.spark.sql.execution.datasources.jdbc
import org.apache.spark.sql.{DataFrame, SaveMode, SQLContext}
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.datasources.jdbc.JdbcUtils._
+import org.apache.spark.sql.execution.metric.SQLMetrics
import org.apache.spark.sql.jdbc.JdbcDialects
import org.apache.spark.sql.sources.{BaseRelation, CreatableRelationProvider, DataSourceRegister, RelationProvider}
@@ -35,9 +36,17 @@ class JdbcRelationProvider extends CreatableRelationProvider
val sparkSession = sqlContext.sparkSession
val resolver = sparkSession.sessionState.conf.resolver
val timeZoneId = sparkSession.sessionState.conf.sessionLocalTimeZone
- val schema = JDBCRelation.getSchema(resolver, jdbcOptions)
+ val remoteSchemaFetchMetric = JdbcUtils.createSchemaFetchMetric(sparkSession.sparkContext)
+ val schema = SQLMetrics.withTimingNs(remoteSchemaFetchMetric) {
+ JDBCRelation.getSchema(resolver, jdbcOptions)
+ }
val parts = JDBCRelation.columnPartition(schema, resolver, timeZoneId, jdbcOptions)
- JDBCRelation(schema, parts, jdbcOptions)(sparkSession)
+ JDBCRelation(
+ schema,
+ parts,
+ jdbcOptions,
+ Map(JDBCRelation.schemaFetchKey -> remoteSchemaFetchMetric)
+ )(sparkSession)
}
override def createRelation(
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcUtils.scala
index 0077012e2b0e4..926c133d2875c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/jdbc/JdbcUtils.scala
@@ -29,9 +29,9 @@ import scala.jdk.CollectionConverters._
import scala.util.{Failure, Success, Try}
import scala.util.control.NonFatal
-import org.apache.spark.{SparkThrowable, SparkUnsupportedOperationException, TaskContext}
+import org.apache.spark.{SparkContext, SparkThrowable, SparkUnsupportedOperationException, TaskContext}
import org.apache.spark.executor.InputMetrics
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{DEFAULT_ISOLATION_LEVEL, ISOLATION_LEVEL}
import org.apache.spark.sql.{DataFrame, Row}
import org.apache.spark.sql.catalyst.{InternalRow, SQLConfHelper}
@@ -46,6 +46,7 @@ import org.apache.spark.sql.connector.catalog.{Identifier, TableChange}
import org.apache.spark.sql.connector.catalog.index.{SupportsIndex, TableIndex}
import org.apache.spark.sql.connector.expressions.NamedReference
import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
+import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
import org.apache.spark.sql.jdbc.{JdbcDialect, JdbcDialects, JdbcType, NoopDialect}
import org.apache.spark.sql.types._
import org.apache.spark.sql.util.SchemaUtils
@@ -357,7 +358,8 @@ object JdbcUtils extends Logging with SQLConfHelper {
resultSet: ResultSet,
dialect: JdbcDialect,
schema: StructType,
- inputMetrics: InputMetrics): Iterator[InternalRow] = {
+ inputMetrics: InputMetrics,
+ fetchAndTransformToInternalRowsMetric: Option[SQLMetric] = None): Iterator[InternalRow] = {
new NextIterator[InternalRow] {
private[this] val rs = resultSet
private[this] val getters: Array[JDBCValueGetter] = makeGetters(dialect, schema)
@@ -372,7 +374,7 @@ object JdbcUtils extends Logging with SQLConfHelper {
}
}
- override protected def getNext(): InternalRow = {
+ private def getNextWithoutTiming: InternalRow = {
if (rs.next()) {
inputMetrics.incRecordsRead(1)
var i = 0
@@ -387,9 +389,26 @@ object JdbcUtils extends Logging with SQLConfHelper {
null.asInstanceOf[InternalRow]
}
}
+
+ override protected def getNext(): InternalRow = {
+ if (fetchAndTransformToInternalRowsMetric.isDefined) {
+ SQLMetrics.withTimingNs(fetchAndTransformToInternalRowsMetric.get) {
+ getNextWithoutTiming
+ }
+ } else {
+ getNextWithoutTiming
+ }
+ }
}
}
+ def createSchemaFetchMetric(sparkContext: SparkContext): SQLMetric = {
+ SQLMetrics.createNanoTimingMetric(
+ sparkContext,
+ JDBCRelation.schemaFetchName
+ )
+ }
+
// A `JDBCValueGetter` is responsible for getting a value from `ResultSet` into a field
// for `MutableRow`. The last argument `Int` means the index for the value to be set in
// the row and also used for the value in `ResultSet`.
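
resultSetToSparkInternalRows now accepts an optional SQLMetric and only times getNext when one is supplied. A standalone sketch of the same Option-gated, per-element instrumentation; TimedIterator is a hypothetical name and a LongAdder stands in for SQLMetric.

import java.util.concurrent.atomic.LongAdder

final class TimedIterator[T](underlying: Iterator[T], metric: Option[LongAdder])
  extends Iterator[T] {

  override def hasNext: Boolean = underlying.hasNext

  private def nextWithoutTiming(): T = underlying.next()

  // When a metric is supplied, each element fetch is timed; otherwise the untimed path runs.
  override def next(): T = metric match {
    case Some(m) =>
      val start = System.nanoTime()
      try nextWithoutTiming() finally m.add(System.nanoTime() - start)
    case None =>
      nextWithoutTiming()
  }
}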
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonDataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonDataSource.scala
index bedf5ec62e4ee..aaa5af478dbb7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonDataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonDataSource.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.execution.datasources.json
import java.io.InputStream
import com.fasterxml.jackson.core.{JsonFactory, JsonParser}
-import com.google.common.io.ByteStreams
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileStatus, Path}
import org.apache.hadoop.io.Text
@@ -222,7 +221,7 @@ object MultiLineJsonDataSource extends JsonDataSource {
CodecStreams.createInputStreamWithCloseResource(conf, file.toPath)
}
} { inputStream =>
- UTF8String.fromBytes(ByteStreams.toByteArray(inputStream))
+ UTF8String.fromBytes(inputStream.readAllBytes())
}
}
val streamParser = parser.options.encoding
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonFileFormat.scala
index ed096cf289b56..e3b78ef432505 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonFileFormat.scala
@@ -39,22 +39,15 @@ case class JsonFileFormat() extends TextBasedFileFormat with DataSourceRegister
sparkSession: SparkSession,
options: Map[String, String],
path: Path): Boolean = {
- val parsedOptions = new JSONOptionsInRead(
- options,
- sparkSession.sessionState.conf.sessionLocalTimeZone,
- sparkSession.sessionState.conf.columnNameOfCorruptRecord)
- val jsonDataSource = JsonDataSource(parsedOptions)
- jsonDataSource.isSplitable && super.isSplitable(sparkSession, options, path)
+ val parsedOptions = getJsonOptions(sparkSession, options)
+ JsonDataSource(parsedOptions).isSplitable && super.isSplitable(sparkSession, options, path)
}
override def inferSchema(
sparkSession: SparkSession,
options: Map[String, String],
files: Seq[FileStatus]): Option[StructType] = {
- val parsedOptions = new JSONOptionsInRead(
- options,
- sparkSession.sessionState.conf.sessionLocalTimeZone,
- sparkSession.sessionState.conf.columnNameOfCorruptRecord)
+ val parsedOptions = getJsonOptions(sparkSession, options)
JsonDataSource(parsedOptions).inferSchema(sparkSession, files, parsedOptions)
}
@@ -63,13 +56,9 @@ case class JsonFileFormat() extends TextBasedFileFormat with DataSourceRegister
job: Job,
options: Map[String, String],
dataSchema: StructType): OutputWriterFactory = {
- val conf = job.getConfiguration
- val parsedOptions = new JSONOptions(
- options,
- sparkSession.sessionState.conf.sessionLocalTimeZone,
- sparkSession.sessionState.conf.columnNameOfCorruptRecord)
+ val parsedOptions = getJsonOptions(sparkSession, options, inRead = false)
parsedOptions.compressionCodec.foreach { codec =>
- CompressionCodecs.setCodecConfiguration(conf, codec)
+ CompressionCodecs.setCodecConfiguration(job.getConfiguration, codec)
}
new OutputWriterFactory {
@@ -96,12 +85,7 @@ case class JsonFileFormat() extends TextBasedFileFormat with DataSourceRegister
hadoopConf: Configuration): PartitionedFile => Iterator[InternalRow] = {
val broadcastedHadoopConf =
SerializableConfiguration.broadcast(sparkSession.sparkContext, hadoopConf)
-
- val parsedOptions = new JSONOptionsInRead(
- options,
- sparkSession.sessionState.conf.sessionLocalTimeZone,
- sparkSession.sessionState.conf.columnNameOfCorruptRecord)
-
+ val parsedOptions = getJsonOptions(sparkSession, options)
val actualSchema =
StructType(requiredSchema.filterNot(_.name == parsedOptions.columnNameOfCorruptRecord))
// Check a field requirement for corrupt records here to throw an exception in a driver side
@@ -147,4 +131,16 @@ case class JsonFileFormat() extends TextBasedFileFormat with DataSourceRegister
case _ => false
}
+
+ private def getJsonOptions(
+ spark: SparkSession,
+ options: Map[String, String],
+ inRead: Boolean = true): JSONOptions = {
+ val conf = getSqlConf(spark)
+ if (inRead) {
+ new JSONOptionsInRead(options, conf.sessionLocalTimeZone, conf.columnNameOfCorruptRecord)
+ } else {
+ new JSONOptions(options, conf.sessionLocalTimeZone, conf.columnNameOfCorruptRecord)
+ }
+ }
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonOutputWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonOutputWriter.scala
index 5727c502a7097..4abfd96993785 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonOutputWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/json/JsonOutputWriter.scala
@@ -21,7 +21,7 @@ import java.nio.charset.{Charset, StandardCharsets}
import org.apache.hadoop.fs.Path
import org.apache.hadoop.mapreduce.TaskAttemptContext
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{ENCODING, PATH}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.json.{JacksonGenerator, JSONOptions, JSONOptionsInRead}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/noop/NoopDataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/noop/NoopDataSource.scala
index a662ea3b8d2df..c44c5f780a6be 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/noop/NoopDataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/noop/NoopDataSource.scala
@@ -27,6 +27,7 @@ import org.apache.spark.sql.internal.connector.{SimpleTableProvider, SupportsStr
import org.apache.spark.sql.sources.DataSourceRegister
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.util.CaseInsensitiveStringMap
+import org.apache.spark.util.Utils
/**
* This is no-op datasource. It does not do anything besides consuming its input.
@@ -48,6 +49,7 @@ private[noop] object NoopTable extends Table with SupportsWrite {
TableCapability.TRUNCATE,
TableCapability.ACCEPT_ANY_SCHEMA)
}
+ override def toString: String = Utils.getFormattedClassName(this)
}
private[noop] object NoopWriteBuilder extends WriteBuilder
@@ -59,6 +61,7 @@ private[noop] object NoopWriteBuilder extends WriteBuilder
private[noop] object NoopWrite extends Write {
override def toBatch: BatchWrite = NoopBatchWrite
override def toStreaming: StreamingWrite = NoopStreamingWrite
+ override def toString: String = Utils.getFormattedClassName(this)
}
private[noop] object NoopBatchWrite extends BatchWrite {
@@ -67,6 +70,7 @@ private[noop] object NoopBatchWrite extends BatchWrite {
override def useCommitCoordinator(): Boolean = false
override def commit(messages: Array[WriterCommitMessage]): Unit = {}
override def abort(messages: Array[WriterCommitMessage]): Unit = {}
+ override def toString: String = Utils.getFormattedClassName(this)
}
private[noop] object NoopWriterFactory extends DataWriterFactory {
@@ -86,6 +90,7 @@ private[noop] object NoopStreamingWrite extends StreamingWrite {
override def useCommitCoordinator(): Boolean = false
override def commit(epochId: Long, messages: Array[WriterCommitMessage]): Unit = {}
override def abort(epochId: Long, messages: Array[WriterCommitMessage]): Unit = {}
+ override def toString: String = Utils.getFormattedClassName(this)
}
private[noop] object NoopStreamingDataWriterFactory extends StreamingDataWriterFactory {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcFileFormat.scala
index 86528bf7a0af9..40d10d0e44034 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcFileFormat.scala
@@ -38,6 +38,7 @@ import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.codegen.GenerateUnsafeProjection
import org.apache.spark.sql.catalyst.types.DataTypeUtils.toAttributes
import org.apache.spark.sql.execution.datasources._
+import org.apache.spark.sql.internal.SessionStateHelper
import org.apache.spark.sql.sources._
import org.apache.spark.sql.types._
import org.apache.spark.util.{SerializableConfiguration, Utils}
@@ -48,6 +49,7 @@ import org.apache.spark.util.{SerializableConfiguration, Utils}
class OrcFileFormat
extends FileFormat
with DataSourceRegister
+ with SessionStateHelper
with Serializable {
override def shortName(): String = "orc"
@@ -70,7 +72,8 @@ class OrcFileFormat
job: Job,
options: Map[String, String],
dataSchema: StructType): OutputWriterFactory = {
- val orcOptions = new OrcOptions(options, sparkSession.sessionState.conf)
+ val sqlConf = getSqlConf(sparkSession)
+ val orcOptions = new OrcOptions(options, sqlConf)
val conf = job.getConfiguration
@@ -79,7 +82,7 @@ class OrcFileFormat
conf.asInstanceOf[JobConf]
.setOutputFormat(classOf[org.apache.orc.mapred.OrcOutputFormat[OrcStruct]])
- val batchSize = sparkSession.sessionState.conf.orcVectorizedWriterBatchSize
+ val batchSize = sqlConf.orcVectorizedWriterBatchSize
new OutputWriterFactory {
override def newInstance(
@@ -101,10 +104,10 @@ class OrcFileFormat
}
override def supportBatch(sparkSession: SparkSession, schema: StructType): Boolean = {
- val conf = sparkSession.sessionState.conf
- conf.orcVectorizedReaderEnabled &&
+ val sqlConf = getSqlConf(sparkSession)
+ sqlConf.orcVectorizedReaderEnabled &&
schema.forall(s => OrcUtils.supportColumnarReads(
- s.dataType, sparkSession.sessionState.conf.orcVectorizedReaderNestedColumnEnabled))
+ s.dataType, sqlConf.orcVectorizedReaderNestedColumnEnabled))
}
override def isSplitable(
@@ -136,7 +139,7 @@ class OrcFileFormat
hadoopConf: Configuration): (PartitionedFile) => Iterator[InternalRow] = {
val resultSchema = StructType(requiredSchema.fields ++ partitionSchema.fields)
- val sqlConf = sparkSession.sessionState.conf
+ val sqlConf = getSqlConf(sparkSession)
val capacity = sqlConf.orcVectorizedReaderBatchSize
// Should always be set by FileSourceScanExec creating this.
@@ -163,8 +166,8 @@ class OrcFileFormat
val broadcastedConf =
SerializableConfiguration.broadcast(sparkSession.sparkContext, hadoopConf)
- val isCaseSensitive = sparkSession.sessionState.conf.caseSensitiveAnalysis
- val orcFilterPushDown = sparkSession.sessionState.conf.orcFilterPushDown
+ val isCaseSensitive = sqlConf.caseSensitiveAnalysis
+ val orcFilterPushDown = sqlConf.orcFilterPushDown
(file: PartitionedFile) => {
val conf = broadcastedConf.value.value
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcUtils.scala
index 50c28c783b4cd..20c40f65b0686 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/orc/OrcUtils.scala
@@ -31,7 +31,7 @@ import org.apache.orc.{BooleanColumnStatistics, ColumnStatistics, DateColumnStat
import org.apache.spark.{SPARK_VERSION_SHORT, SparkException}
import org.apache.spark.deploy.SparkHadoopUtil
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.PATH
import org.apache.spark.sql.{SPARK_VERSION_METADATA_KEY, SparkSession}
import org.apache.spark.sql.catalyst.{FileSourceOptions, InternalRow}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFileFormat.scala
index c71d55a41c764..be6e5d1886670 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFileFormat.scala
@@ -32,7 +32,7 @@ import org.apache.parquet.format.converter.ParquetMetadataConverter.SKIP_ROW_GRO
import org.apache.parquet.hadoop._
import org.apache.spark.TaskContext
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{PATH, SCHEMA}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.InternalRow
@@ -44,7 +44,7 @@ import org.apache.spark.sql.catalyst.util.DateTimeUtils
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.datasources._
import org.apache.spark.sql.execution.vectorized.{ConstantColumnVector, OffHeapColumnVector, OnHeapColumnVector}
-import org.apache.spark.sql.internal.SQLConf
+import org.apache.spark.sql.internal.{SessionStateHelper, SQLConf}
import org.apache.spark.sql.sources._
import org.apache.spark.sql.types._
import org.apache.spark.util.{SerializableConfiguration, ThreadUtils}
@@ -52,6 +52,7 @@ import org.apache.spark.util.{SerializableConfiguration, ThreadUtils}
class ParquetFileFormat
extends FileFormat
with DataSourceRegister
+ with SessionStateHelper
with Logging
with Serializable {
@@ -68,7 +69,7 @@ class ParquetFileFormat
job: Job,
options: Map[String, String],
dataSchema: StructType): OutputWriterFactory = {
- val sqlConf = sparkSession.sessionState.conf
+ val sqlConf = getSqlConf(sparkSession)
val parquetOptions = new ParquetOptions(options, sqlConf)
ParquetUtils.prepareWrite(sqlConf, job, dataSchema, parquetOptions)
}
@@ -84,8 +85,7 @@ class ParquetFileFormat
* Returns whether the reader can return the rows as batch or not.
*/
override def supportBatch(sparkSession: SparkSession, schema: StructType): Boolean = {
- val conf = sparkSession.sessionState.conf
- ParquetUtils.isBatchReadSupportedForSchema(conf, schema)
+ ParquetUtils.isBatchReadSupportedForSchema(getSqlConf(sparkSession), schema)
}
override def vectorTypes(
@@ -128,6 +128,7 @@ class ParquetFileFormat
filters: Seq[Filter],
options: Map[String, String],
hadoopConf: Configuration): (PartitionedFile) => Iterator[InternalRow] = {
+ val sqlConf = getSqlConf(sparkSession)
hadoopConf.set(ParquetInputFormat.READ_SUPPORT_CLASS, classOf[ParquetReadSupport].getName)
hadoopConf.set(
ParquetReadSupport.SPARK_ROW_REQUESTED_SCHEMA,
@@ -137,27 +138,27 @@ class ParquetFileFormat
requiredSchema.json)
hadoopConf.set(
SQLConf.SESSION_LOCAL_TIMEZONE.key,
- sparkSession.sessionState.conf.sessionLocalTimeZone)
+ sqlConf.sessionLocalTimeZone)
hadoopConf.setBoolean(
SQLConf.NESTED_SCHEMA_PRUNING_ENABLED.key,
- sparkSession.sessionState.conf.nestedSchemaPruningEnabled)
+ sqlConf.nestedSchemaPruningEnabled)
hadoopConf.setBoolean(
SQLConf.CASE_SENSITIVE.key,
- sparkSession.sessionState.conf.caseSensitiveAnalysis)
+ sqlConf.caseSensitiveAnalysis)
// Sets flags for `ParquetToSparkSchemaConverter`
hadoopConf.setBoolean(
SQLConf.PARQUET_BINARY_AS_STRING.key,
- sparkSession.sessionState.conf.isParquetBinaryAsString)
+ sqlConf.isParquetBinaryAsString)
hadoopConf.setBoolean(
SQLConf.PARQUET_INT96_AS_TIMESTAMP.key,
- sparkSession.sessionState.conf.isParquetINT96AsTimestamp)
+ sqlConf.isParquetINT96AsTimestamp)
hadoopConf.setBoolean(
SQLConf.PARQUET_INFER_TIMESTAMP_NTZ_ENABLED.key,
- sparkSession.sessionState.conf.parquetInferTimestampNTZEnabled)
+ sqlConf.parquetInferTimestampNTZEnabled)
hadoopConf.setBoolean(
SQLConf.LEGACY_PARQUET_NANOS_AS_LONG.key,
- sparkSession.sessionState.conf.legacyParquetNanosAsLong)
+ sqlConf.legacyParquetNanosAsLong)
val broadcastedHadoopConf =
@@ -167,7 +168,6 @@ class ParquetFileFormat
// If true, enable using the custom RecordReader for parquet. This only works for
// a subset of the types (no complex types).
val resultSchema = StructType(partitionSchema.fields ++ requiredSchema.fields)
- val sqlConf = sparkSession.sessionState.conf
val enableOffHeapColumnVector = sqlConf.offHeapColumnVectorEnabled
val enableVectorizedReader: Boolean =
ParquetUtils.isBatchReadSupportedForSchema(sqlConf, resultSchema)
@@ -181,13 +181,13 @@ class ParquetFileFormat
val pushDownStringPredicate = sqlConf.parquetFilterPushDownStringPredicate
val pushDownInFilterThreshold = sqlConf.parquetFilterPushDownInFilterThreshold
val isCaseSensitive = sqlConf.caseSensitiveAnalysis
- val parquetOptions = new ParquetOptions(options, sparkSession.sessionState.conf)
+ val parquetOptions = new ParquetOptions(options, sqlConf)
val datetimeRebaseModeInRead = parquetOptions.datetimeRebaseModeInRead
val int96RebaseModeInRead = parquetOptions.int96RebaseModeInRead
// Should always be set by FileSourceScanExec creating this.
// Check conf before checking option, to allow working around an issue by changing conf.
- val returningBatch = sparkSession.sessionState.conf.parquetVectorizedReaderEnabled &&
+ val returningBatch = sqlConf.parquetVectorizedReaderEnabled &&
options.getOrElse(FileFormat.OPTION_RETURNING_BATCH,
throw new IllegalArgumentException(
"OPTION_RETURNING_BATCH should always be set for ParquetFileFormat. " +
@@ -380,11 +380,12 @@ object ParquetFileFormat extends Logging {
private[parquet] def readSchema(
footers: Seq[Footer], sparkSession: SparkSession): Option[StructType] = {
+ val sqlConf = SessionStateHelper.getSqlConf(sparkSession)
val converter = new ParquetToSparkSchemaConverter(
- sparkSession.sessionState.conf.isParquetBinaryAsString,
- sparkSession.sessionState.conf.isParquetINT96AsTimestamp,
- inferTimestampNTZ = sparkSession.sessionState.conf.parquetInferTimestampNTZEnabled,
- nanosAsLong = sparkSession.sessionState.conf.legacyParquetNanosAsLong)
+ sqlConf.isParquetBinaryAsString,
+ sqlConf.isParquetINT96AsTimestamp,
+ inferTimestampNTZ = sqlConf.parquetInferTimestampNTZEnabled,
+ nanosAsLong = sqlConf.legacyParquetNanosAsLong)
val seen = mutable.HashSet[String]()
val finalSchemas: Seq[StructType] = footers.flatMap { footer =>
@@ -478,10 +479,11 @@ object ParquetFileFormat extends Logging {
parameters: Map[String, String],
filesToTouch: Seq[FileStatus],
sparkSession: SparkSession): Option[StructType] = {
- val assumeBinaryIsString = sparkSession.sessionState.conf.isParquetBinaryAsString
- val assumeInt96IsTimestamp = sparkSession.sessionState.conf.isParquetINT96AsTimestamp
- val inferTimestampNTZ = sparkSession.sessionState.conf.parquetInferTimestampNTZEnabled
- val nanosAsLong = sparkSession.sessionState.conf.legacyParquetNanosAsLong
+ val sqlConf = SessionStateHelper.getSqlConf(sparkSession)
+ val assumeBinaryIsString = sqlConf.isParquetBinaryAsString
+ val assumeInt96IsTimestamp = sqlConf.isParquetINT96AsTimestamp
+ val inferTimestampNTZ = sqlConf.parquetInferTimestampNTZEnabled
+ val nanosAsLong = sqlConf.legacyParquetNanosAsLong
val reader = (files: Seq[FileStatus], conf: Configuration, ignoreCorruptFiles: Boolean) => {
// Converter used to convert Parquet `MessageType` to Spark SQL `StructType`
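The ParquetFileFormat hunks above hoist the session configuration into a single cached `sqlConf` (via the `SessionStateHelper.getSqlConf` helper used elsewhere in this patch) instead of dereferencing `sparkSession.sessionState.conf` once per setting. A minimal sketch of that pattern, assuming only the helper and config keys already visible in this diff; the function name `copySessionConf` is hypothetical:

```scala
import org.apache.hadoop.conf.Configuration
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.internal.{SessionStateHelper, SQLConf}

// Hypothetical helper: resolve the SQLConf once and reuse it for every key
// copied into the Hadoop configuration, rather than re-resolving it each time.
def copySessionConf(sparkSession: SparkSession, hadoopConf: Configuration): Unit = {
  val sqlConf = SessionStateHelper.getSqlConf(sparkSession)
  hadoopConf.set(SQLConf.SESSION_LOCAL_TIMEZONE.key, sqlConf.sessionLocalTimeZone)
  hadoopConf.setBoolean(SQLConf.CASE_SENSITIVE.key, sqlConf.caseSensitiveAnalysis)
  hadoopConf.setBoolean(SQLConf.PARQUET_BINARY_AS_STRING.key, sqlConf.isParquetBinaryAsString)
}
```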
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFilters.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFilters.scala
index 565742671b9cd..4a9b17bf98e59 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFilters.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetFilters.scala
@@ -22,6 +22,7 @@ import java.math.{BigDecimal => JBigDecimal}
import java.nio.charset.StandardCharsets.UTF_8
import java.sql.{Date, Timestamp}
import java.time.{Duration, Instant, LocalDate, LocalTime, Period}
+import java.time.temporal.ChronoField.MICRO_OF_DAY
import java.util.HashSet
import java.util.Locale
@@ -149,7 +150,7 @@ class ParquetFilters(
ParquetSchemaType(LogicalTypeAnnotation.timestampType(true, TimeUnit.MICROS), INT64, 0)
private val ParquetTimestampMillisType =
ParquetSchemaType(LogicalTypeAnnotation.timestampType(true, TimeUnit.MILLIS), INT64, 0)
- private val ParquetTimeType =
+ private val ParquetTimeMicrosType =
ParquetSchemaType(LogicalTypeAnnotation.timeType(false, TimeUnit.MICROS), INT64, 0)
private def dateToDays(date: Any): Int = {
@@ -176,7 +177,7 @@ class ParquetFilters(
}
private def localTimeToMicros(v: Any): JLong = {
- DateTimeUtils.localTimeToMicros(v.asInstanceOf[LocalTime])
+ v.asInstanceOf[LocalTime].getLong(MICRO_OF_DAY)
}
private def decimalToInt32(decimal: JBigDecimal): Integer = decimal.unscaledValue().intValue()
@@ -213,7 +214,7 @@ class ParquetFilters(
private def toLongValue(v: Any): JLong = v match {
case d: Duration => IntervalUtils.durationToMicros(d)
- case lt: LocalTime => DateTimeUtils.localTimeToMicros(lt)
+ case lt: LocalTime => localTimeToMicros(lt)
case l => l.asInstanceOf[JLong]
}
@@ -251,7 +252,7 @@ class ParquetFilters(
(n: Array[String], v: Any) => FilterApi.eq(
longColumn(n),
Option(v).map(timestampToMillis).orNull)
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], v: Any) => FilterApi.eq(
longColumn(n),
Option(v).map(localTimeToMicros).orNull)
@@ -304,7 +305,7 @@ class ParquetFilters(
(n: Array[String], v: Any) => FilterApi.notEq(
longColumn(n),
Option(v).map(timestampToMillis).orNull)
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], v: Any) => FilterApi.notEq(
longColumn(n),
Option(v).map(localTimeToMicros).orNull)
@@ -348,7 +349,7 @@ class ParquetFilters(
(n: Array[String], v: Any) => FilterApi.lt(longColumn(n), timestampToMicros(v))
case ParquetTimestampMillisType if pushDownTimestamp =>
(n: Array[String], v: Any) => FilterApi.lt(longColumn(n), timestampToMillis(v))
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], v: Any) => FilterApi.lt(longColumn(n), localTimeToMicros(v))
case ParquetSchemaType(_: DecimalLogicalTypeAnnotation, INT32, _) if pushDownDecimal =>
@@ -387,7 +388,7 @@ class ParquetFilters(
(n: Array[String], v: Any) => FilterApi.ltEq(longColumn(n), timestampToMicros(v))
case ParquetTimestampMillisType if pushDownTimestamp =>
(n: Array[String], v: Any) => FilterApi.ltEq(longColumn(n), timestampToMillis(v))
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], v: Any) => FilterApi.ltEq(longColumn(n), localTimeToMicros(v))
case ParquetSchemaType(_: DecimalLogicalTypeAnnotation, INT32, _) if pushDownDecimal =>
@@ -426,7 +427,7 @@ class ParquetFilters(
(n: Array[String], v: Any) => FilterApi.gt(longColumn(n), timestampToMicros(v))
case ParquetTimestampMillisType if pushDownTimestamp =>
(n: Array[String], v: Any) => FilterApi.gt(longColumn(n), timestampToMillis(v))
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], v: Any) => FilterApi.gt(longColumn(n), localTimeToMicros(v))
case ParquetSchemaType(_: DecimalLogicalTypeAnnotation, INT32, _) if pushDownDecimal =>
@@ -465,7 +466,7 @@ class ParquetFilters(
(n: Array[String], v: Any) => FilterApi.gtEq(longColumn(n), timestampToMicros(v))
case ParquetTimestampMillisType if pushDownTimestamp =>
(n: Array[String], v: Any) => FilterApi.gtEq(longColumn(n), timestampToMillis(v))
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], v: Any) => FilterApi.gtEq(longColumn(n), localTimeToMicros(v))
case ParquetSchemaType(_: DecimalLogicalTypeAnnotation, INT32, _) if pushDownDecimal =>
@@ -556,7 +557,7 @@ class ParquetFilters(
}
FilterApi.in(longColumn(n), set)
- case ParquetTimeType =>
+ case ParquetTimeMicrosType =>
(n: Array[String], values: Array[Any]) =>
val set = new HashSet[JLong]()
for (value <- values) {
@@ -661,7 +662,7 @@ class ParquetFilters(
value.isInstanceOf[Date] || value.isInstanceOf[LocalDate]
case ParquetTimestampMicrosType | ParquetTimestampMillisType =>
value.isInstanceOf[Timestamp] || value.isInstanceOf[Instant]
- case ParquetTimeType => value.isInstanceOf[LocalTime]
+ case ParquetTimeMicrosType => value.isInstanceOf[LocalTime]
case ParquetSchemaType(decimalType: DecimalLogicalTypeAnnotation, INT32, _) =>
isDecimalMatched(value, decimalType)
case ParquetSchemaType(decimalType: DecimalLogicalTypeAnnotation, INT64, _) =>
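The `localTimeToMicros` change above drops the `DateTimeUtils` dependency in favor of `java.time` directly: `ChronoField.MICRO_OF_DAY` yields the microseconds-since-midnight value that a Parquet `TIME(MICROS)` column stores as INT64. A self-contained example using only the JDK:

```scala
import java.time.LocalTime
import java.time.temporal.ChronoField.MICRO_OF_DAY

// 01:02:03.000004 expressed as microseconds since midnight.
val t = LocalTime.of(1, 2, 3, 4000)        // nanoOfSecond = 4000, i.e. 4 microseconds
val micros: Long = t.getLong(MICRO_OF_DAY) // 3723000004
```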
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetOptions.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetOptions.scala
index eaedd99d8628c..dd5669bda07c9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetOptions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetOptions.scala
@@ -24,7 +24,7 @@ import org.apache.parquet.hadoop.ParquetOutputFormat
import org.apache.spark.sql.catalyst.{DataSourceOptions, FileSourceOptions}
import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.internal.{LegacyBehaviorPolicy, SQLConf}
+import org.apache.spark.sql.internal.SQLConf
/**
* Options for the Parquet data source.
@@ -74,16 +74,15 @@ class ParquetOptions(
/**
* The rebasing mode for the DATE and TIMESTAMP_MICROS, TIMESTAMP_MILLIS values in reads.
*/
- def datetimeRebaseModeInRead: LegacyBehaviorPolicy.Value = parameters
+ def datetimeRebaseModeInRead: String = parameters
.get(DATETIME_REBASE_MODE)
- .map(LegacyBehaviorPolicy.withName)
- .getOrElse(sqlConf.getConf(SQLConf.PARQUET_REBASE_MODE_IN_READ))
+ .getOrElse(sqlConf.getConf(SQLConf.PARQUET_REBASE_MODE_IN_READ).toString)
/**
* The rebasing mode for INT96 timestamp values in reads.
*/
- def int96RebaseModeInRead: LegacyBehaviorPolicy.Value = parameters
- .get(INT96_REBASE_MODE).map(LegacyBehaviorPolicy.withName)
- .getOrElse(sqlConf.getConf(SQLConf.PARQUET_INT96_REBASE_MODE_IN_READ))
+ def int96RebaseModeInRead: String = parameters
+ .get(INT96_REBASE_MODE)
+ .getOrElse(sqlConf.getConf(SQLConf.PARQUET_INT96_REBASE_MODE_IN_READ).toString)
}
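With the change above, both rebase modes are exposed as plain `String`s: a per-read data source option wins, otherwise the session-level SQLConf value is rendered via `toString`. A small sketch of that fallback shape; the literal option key below is a stand-in for the `DATETIME_REBASE_MODE` constant used in the real class:

```scala
import org.apache.spark.sql.internal.SQLConf

// The explicit option takes precedence; otherwise fall back to the session default,
// rendered as a String instead of a LegacyBehaviorPolicy value.
def rebaseModeInRead(parameters: Map[String, String], sqlConf: SQLConf): String =
  parameters
    .get("datetimeRebaseMode") // stand-in key; the real code uses DATETIME_REBASE_MODE
    .getOrElse(sqlConf.getConf(SQLConf.PARQUET_REBASE_MODE_IN_READ).toString)
```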
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetReadSupport.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetReadSupport.scala
index af0bf0d51f077..09fd0eccec4b3 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetReadSupport.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetReadSupport.scala
@@ -423,7 +423,7 @@ object ParquetReadSupport extends Logging {
caseSensitiveParquetFieldMap
.get(f.name)
.map(clipParquetType(_, f.dataType, caseSensitive, useFieldId))
- .getOrElse(toParquet.convertField(f))
+ .getOrElse(toParquet.convertField(f, inShredded = false))
}
def matchCaseInsensitiveField(f: StructField): Type = {
@@ -439,7 +439,7 @@ object ParquetReadSupport extends Logging {
} else {
clipParquetType(parquetTypes.head, f.dataType, caseSensitive, useFieldId)
}
- }.getOrElse(toParquet.convertField(f))
+ }.getOrElse(toParquet.convertField(f, inShredded = false))
}
def matchIdField(f: StructField): Type = {
@@ -458,7 +458,7 @@ object ParquetReadSupport extends Logging {
}.getOrElse {
// When there is no ID match, we use a fake name to avoid a name match by accident
// We need this name to be unique as well, otherwise there will be type conflicts
- toParquet.convertField(f.copy(name = generateFakeColumnName))
+ toParquet.convertField(f.copy(name = generateFakeColumnName), inShredded = false)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetRowConverter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetRowConverter.scala
index 0927f5c3c963c..cb5e7bf532157 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetRowConverter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetRowConverter.scala
@@ -487,7 +487,8 @@ private[parquet] class ParquetRowConverter(
.asInstanceOf[TimeLogicalTypeAnnotation].getUnit == TimeUnit.MICROS =>
new ParquetPrimitiveConverter(updater) {
override def addLong(value: Long): Unit = {
- this.updater.setLong(value)
+ val nanos = DateTimeUtils.microsToNanos(value)
+ this.updater.setLong(nanos)
}
}
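The converter change above stops passing the raw INT64 through: Parquet `TIME(MICROS)` values are widened to Spark's internal nanosecond representation on read. The arithmetic is a checked multiply by 1000; a standalone sketch whose helper name echoes, but is not, Spark's `DateTimeUtils.microsToNanos`:

```scala
// Parquet stores TIME(MICROS) as microseconds since midnight; Spark's TIME type
// keeps nanoseconds internally, so readers scale the stored value up by 1000.
def microsToNanosSketch(micros: Long): Long = Math.multiplyExact(micros, 1000L)

val storedMicros = 3723000004L                         // 01:02:03.000004
val internalNanos = microsToNanosSketch(storedMicros)  // 3723000004000
```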
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetSchemaConverter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetSchemaConverter.scala
index e05d5fe2fd88a..0df21e2a52295 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetSchemaConverter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetSchemaConverter.scala
@@ -196,8 +196,7 @@ class ParquetToSparkSchemaConverter(
field: ColumnIO,
sparkReadType: Option[DataType] = None): ParquetColumn = {
val targetType = sparkReadType.map {
- case udt: UserDefinedType[_] => udt.sqlType
- case otherType => otherType
+ _.transformRecursively { case t: UserDefinedType[_] => t.sqlType }
}
field match {
case primitiveColumn: PrimitiveColumnIO => convertPrimitiveField(primitiveColumn, targetType)
@@ -550,15 +549,16 @@ class SparkToParquetSchemaConverter(
def convert(catalystSchema: StructType): MessageType = {
Types
.buildMessage()
- .addFields(catalystSchema.map(convertField): _*)
+ .addFields(catalystSchema.map(f => convertField(f, inShredded = false)): _*)
.named(ParquetSchemaConverter.SPARK_PARQUET_SCHEMA_NAME)
}
/**
- * Converts a Spark SQL [[StructField]] to a Parquet [[Type]].
+ * Converts a Spark SQL [[StructField]] to a Parquet [[Type]]. `inShredded` indicates whether
+ * the field is within a shredded Variant schema.
*/
- def convertField(field: StructField): Type = {
- val converted = convertField(field, if (field.nullable) OPTIONAL else REQUIRED)
+ def convertField(field: StructField, inShredded: Boolean): Type = {
+ val converted = convertField(field, if (field.nullable) OPTIONAL else REQUIRED, inShredded)
if (useFieldId && ParquetUtils.hasFieldId(field)) {
converted.withId(ParquetUtils.getFieldId(field))
} else {
@@ -566,7 +566,10 @@ class SparkToParquetSchemaConverter(
}
}
- private def convertField(field: StructField, repetition: Type.Repetition): Type = {
+ private def convertField(
+ field: StructField,
+ repetition: Type.Repetition,
+ inShredded: Boolean): Type = {
field.dataType match {
// ===================
@@ -622,16 +625,26 @@ class SparkToParquetSchemaConverter(
// from Spark 1.5.0, we resort to a timestamp type with microsecond precision so that we can
// store a timestamp into a `Long`. This design decision is subject to change though, for
// example, we may resort to nanosecond precision in the future.
+ //
+ // The Parquet Variant Shredding spec states that timestamps coming from shredded Variants
+ // must be stored as INT64. Since the Spark Timestamp type always has microsecond precision,
+ // the TIMESTAMP_MICROS configuration is used when writing shredded variant timestamp
+ // subfields.

case TimestampType =>
- outputTimestampType match {
- case SQLConf.ParquetOutputTimestampType.INT96 =>
- Types.primitive(INT96, repetition).named(field.name)
- case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MICROS =>
- Types.primitive(INT64, repetition)
- .as(LogicalTypeAnnotation.timestampType(true, TimeUnit.MICROS)).named(field.name)
- case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MILLIS =>
- Types.primitive(INT64, repetition)
- .as(LogicalTypeAnnotation.timestampType(true, TimeUnit.MILLIS)).named(field.name)
+ if (inShredded) {
+ Types.primitive(INT64, repetition)
+ .as(LogicalTypeAnnotation.timestampType(true, TimeUnit.MICROS)).named(field.name)
+ } else {
+ outputTimestampType match {
+ case SQLConf.ParquetOutputTimestampType.INT96 =>
+ Types.primitive(INT96, repetition).named(field.name)
+ case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MICROS =>
+ Types.primitive(INT64, repetition)
+ .as(LogicalTypeAnnotation.timestampType(true, TimeUnit.MICROS)).named(field.name)
+ case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MILLIS =>
+ Types.primitive(INT64, repetition)
+ .as(LogicalTypeAnnotation.timestampType(true, TimeUnit.MILLIS)).named(field.name)
+ }
}
case TimestampNTZType =>
@@ -707,7 +720,7 @@ class SparkToParquetSchemaConverter(
.buildGroup(repetition).as(LogicalTypeAnnotation.listType())
.addField(Types
.buildGroup(REPEATED)
- .addField(convertField(StructField("array", elementType, nullable)))
+ .addField(convertField(StructField("array", elementType, nullable), inShredded))
.named("bag"))
.named(field.name)
@@ -723,7 +736,7 @@ class SparkToParquetSchemaConverter(
Types
.buildGroup(repetition).as(LogicalTypeAnnotation.listType())
// "array" is the name chosen by parquet-avro (1.7.0 and prior version)
- .addField(convertField(StructField("array", elementType, nullable), REPEATED))
+ .addField(convertField(StructField("array", elementType, nullable), REPEATED, inShredded))
.named(field.name)
// Spark 1.4.x and prior versions convert MapType into a 3-level group annotated by
@@ -738,8 +751,8 @@ class SparkToParquetSchemaConverter(
ConversionPatterns.mapType(
repetition,
field.name,
- convertField(StructField("key", keyType, nullable = false)),
- convertField(StructField("value", valueType, valueContainsNull)))
+ convertField(StructField("key", keyType, nullable = false), inShredded),
+ convertField(StructField("value", valueType, valueContainsNull), inShredded))
// =====================================
// ArrayType and MapType (standard mode)
@@ -755,7 +768,7 @@ class SparkToParquetSchemaConverter(
.buildGroup(repetition).as(LogicalTypeAnnotation.listType())
.addField(
Types.repeatedGroup()
- .addField(convertField(StructField("element", elementType, containsNull)))
+ .addField(convertField(StructField("element", elementType, containsNull), inShredded))
.named("list"))
.named(field.name)
@@ -771,9 +784,10 @@ class SparkToParquetSchemaConverter(
.addField(
Types
.repeatedGroup()
- .addField(convertField(StructField("key", keyType, nullable = false)))
- .addField(convertField(StructField("value", valueType, valueContainsNull)))
- .named("key_value"))
+ .addField(convertField(StructField("key", keyType, nullable = false), inShredded))
+ .addField(
+ convertField(StructField("value", valueType, valueContainsNull), inShredded)
+ ).named("key_value"))
.named(field.name)
// ===========
@@ -782,25 +796,25 @@ class SparkToParquetSchemaConverter(
case VariantType =>
Types.buildGroup(repetition)
- .addField(convertField(StructField("value", BinaryType, nullable = false)))
- .addField(convertField(StructField("metadata", BinaryType, nullable = false)))
+ .addField(convertField(StructField("value", BinaryType, nullable = false), inShredded))
+ .addField(convertField(StructField("metadata", BinaryType, nullable = false), inShredded))
.named(field.name)
case s: StructType if SparkShreddingUtils.isVariantShreddingStruct(s) =>
// Variant struct takes a Variant and writes to Parquet as a shredded schema.
val group = Types.buildGroup(repetition)
s.fields.foreach { f =>
- group.addField(convertField(f))
+ group.addField(convertField(f, inShredded = true))
}
group.named(field.name)
case StructType(fields) =>
fields.foldLeft(Types.buildGroup(repetition)) { (builder, field) =>
- builder.addField(convertField(field))
+ builder.addField(convertField(field, inShredded))
}.named(field.name)
case udt: UserDefinedType[_] =>
- convertField(field.copy(dataType = udt.sqlType))
+ convertField(field.copy(dataType = udt.sqlType), inShredded)
case _ =>
throw QueryCompilationErrors.cannotConvertDataTypeToParquetTypeError(field)
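Per the TimestampType branch above, a timestamp nested in a shredded Variant schema ignores `spark.sql.parquet.outputTimestampType` and is always emitted as INT64 annotated with `TIMESTAMP(isAdjustedToUTC = true, MICROS)`. A minimal parquet-mr sketch of the resulting field; `typed_value` is the shredding column name used elsewhere in this patch:

```scala
import org.apache.parquet.schema.{LogicalTypeAnnotation, Type, Types}
import org.apache.parquet.schema.LogicalTypeAnnotation.TimeUnit
import org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT64
import org.apache.parquet.schema.Type.Repetition.OPTIONAL

// Shredded Variant timestamp subfields: always INT64 + TIMESTAMP(MICROS, adjustedToUTC).
val shreddedTimestamp: Type = Types
  .primitive(INT64, OPTIONAL)
  .as(LogicalTypeAnnotation.timestampType(true, TimeUnit.MICROS))
  .named("typed_value")
```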
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetUtils.scala
index bad883534115c..5db3b0671db9f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetUtils.scala
@@ -33,7 +33,7 @@ import org.apache.parquet.schema.{PrimitiveType, Types}
import org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName
import org.apache.spark.{SparkException, SparkUnsupportedOperationException}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CLASS_NAME, CONFIG}
import org.apache.spark.sql.{Row, SparkSession}
import org.apache.spark.sql.catalyst.InternalRow
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetWriteSupport.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetWriteSupport.scala
index 4022f7ea30032..2ab9fb64da43d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetWriteSupport.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/ParquetWriteSupport.scala
@@ -120,7 +120,8 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
SQLConf.ParquetOutputTimestampType.withName(configuration.get(key))
}
- this.rootFieldWriters = shreddedSchema.map(_.dataType).map(makeWriter).toArray[ValueWriter]
+ this.rootFieldWriters =
+ shreddedSchema.map(_.dataType).map(makeWriter(_, inShredded = false)).toArray[ValueWriter]
val messageType = new SparkToParquetSchemaConverter(configuration).convert(shreddedSchema)
val metadata = Map(
@@ -187,7 +188,9 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
}
}
- private def makeWriter(dataType: DataType): ValueWriter = {
+ // `inShredded` indicates whether the current traversal is nested within a shredded Variant
+ // schema. This affects how timestamp values are written.
+ private def makeWriter(dataType: DataType, inShredded: Boolean): ValueWriter = {
dataType match {
case BooleanType =>
(row: SpecializedGetters, ordinal: Int) =>
@@ -209,7 +212,7 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
(row: SpecializedGetters, ordinal: Int) =>
recordConsumer.addInteger(row.getInt(ordinal))
- case LongType | _: DayTimeIntervalType | _: TimeType =>
+ case LongType | _: DayTimeIntervalType =>
(row: SpecializedGetters, ordinal: Int) =>
recordConsumer.addLong(row.getLong(ordinal))
@@ -227,25 +230,34 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
Binary.fromReusedByteArray(row.getUTF8String(ordinal).getBytes))
case TimestampType =>
- outputTimestampType match {
- case SQLConf.ParquetOutputTimestampType.INT96 =>
- (row: SpecializedGetters, ordinal: Int) =>
- val micros = int96RebaseFunc(row.getLong(ordinal))
- val (julianDay, timeOfDayNanos) = DateTimeUtils.toJulianDay(micros)
- val buf = ByteBuffer.wrap(timestampBuffer)
- buf.order(ByteOrder.LITTLE_ENDIAN).putLong(timeOfDayNanos).putInt(julianDay)
- recordConsumer.addBinary(Binary.fromReusedByteArray(timestampBuffer))
-
- case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MICROS =>
- (row: SpecializedGetters, ordinal: Int) =>
- val micros = row.getLong(ordinal)
- recordConsumer.addLong(timestampRebaseFunc(micros))
-
- case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MILLIS =>
- (row: SpecializedGetters, ordinal: Int) =>
- val micros = row.getLong(ordinal)
- val millis = DateTimeUtils.microsToMillis(timestampRebaseFunc(micros))
- recordConsumer.addLong(millis)
+ if (inShredded) {
+ // The Parquet Variant Shredding spec states that timestamp types must be stored as
+ // INT64. Since the Spark Timestamp type always has microsecond granularity, we always
+ // write shredded timestamps with the TIMESTAMP_MICROS configuration.
+ (row: SpecializedGetters, ordinal: Int) =>
+ val micros = row.getLong(ordinal)
+ recordConsumer.addLong(timestampRebaseFunc(micros))
+ } else {
+ outputTimestampType match {
+ case SQLConf.ParquetOutputTimestampType.INT96 =>
+ (row: SpecializedGetters, ordinal: Int) =>
+ val micros = int96RebaseFunc(row.getLong(ordinal))
+ val (julianDay, timeOfDayNanos) = DateTimeUtils.toJulianDay(micros)
+ val buf = ByteBuffer.wrap(timestampBuffer)
+ buf.order(ByteOrder.LITTLE_ENDIAN).putLong(timeOfDayNanos).putInt(julianDay)
+ recordConsumer.addBinary(Binary.fromReusedByteArray(timestampBuffer))
+
+ case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MICROS =>
+ (row: SpecializedGetters, ordinal: Int) =>
+ val micros = row.getLong(ordinal)
+ recordConsumer.addLong(timestampRebaseFunc(micros))
+
+ case SQLConf.ParquetOutputTimestampType.TIMESTAMP_MILLIS =>
+ (row: SpecializedGetters, ordinal: Int) =>
+ val micros = row.getLong(ordinal)
+ val millis = DateTimeUtils.microsToMillis(timestampRebaseFunc(micros))
+ recordConsumer.addLong(millis)
+ }
}
case TimestampNTZType =>
@@ -253,6 +265,10 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
// MICROS time unit.
(row: SpecializedGetters, ordinal: Int) => recordConsumer.addLong(row.getLong(ordinal))
+ case _: TimeType =>
+ (row: SpecializedGetters, ordinal: Int) =>
+ recordConsumer.addLong(DateTimeUtils.nanosToMicros(row.getLong(ordinal)))
+
case BinaryType =>
(row: SpecializedGetters, ordinal: Int) =>
recordConsumer.addBinary(Binary.fromReusedByteArray(row.getBinary(ordinal)))
@@ -273,7 +289,8 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
}
case s: StructType if SparkShreddingUtils.isVariantShreddingStruct(s) =>
- val fieldWriters = s.map(_.dataType).map(makeWriter).toArray[ValueWriter]
+ val fieldWriters =
+ s.map(_.dataType).map(makeWriter(_, inShredded = true)).toArray[ValueWriter]
val variantShreddingSchema = SparkShreddingUtils.buildVariantSchema(s)
(row: SpecializedGetters, ordinal: Int) =>
val v = row.getVariant(ordinal)
@@ -284,17 +301,18 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
}
case t: StructType =>
- val fieldWriters = t.map(_.dataType).map(makeWriter).toArray[ValueWriter]
+ val fieldWriters =
+ t.map(_.dataType).map(makeWriter(_, inShredded)).toArray[ValueWriter]
(row: SpecializedGetters, ordinal: Int) =>
consumeGroup {
writeFields(row.getStruct(ordinal, t.length), t, fieldWriters)
}
- case t: ArrayType => makeArrayWriter(t)
+ case t: ArrayType => makeArrayWriter(t, inShredded)
- case t: MapType => makeMapWriter(t)
+ case t: MapType => makeMapWriter(t, inShredded)
- case t: UserDefinedType[_] => makeWriter(t.sqlType)
+ case t: UserDefinedType[_] => makeWriter(t.sqlType, inShredded)
case _ => throw SparkException.internalError(s"Unsupported data type $dataType.")
}
@@ -373,8 +391,9 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
}
}
- def makeArrayWriter(arrayType: ArrayType): ValueWriter = {
- val elementWriter = makeWriter(arrayType.elementType)
+ def makeArrayWriter(arrayType: ArrayType, inShredded: Boolean): ValueWriter = {
+ // The shredded schema should not have an array inside
+ val elementWriter = makeWriter(arrayType.elementType, inShredded)
def threeLevelArrayWriter(repeatedGroupName: String, elementFieldName: String): ValueWriter =
(row: SpecializedGetters, ordinal: Int) => {
@@ -453,9 +472,12 @@ class ParquetWriteSupport extends WriteSupport[InternalRow] with Logging {
}
}
- private def makeMapWriter(mapType: MapType): ValueWriter = {
- val keyWriter = makeWriter(mapType.keyType)
- val valueWriter = makeWriter(mapType.valueType)
+ private def makeMapWriter(mapType: MapType, inShredded: Boolean): ValueWriter = {
+ // TODO: If maps are ever supported in the shredded schema, we should add a test in
+ // `ParquetVariantShreddingSuite` to make sure that timestamps within maps are shredded
+ // correctly as INT64.
+ val keyWriter = makeWriter(mapType.keyType, inShredded)
+ val valueWriter = makeWriter(mapType.valueType, inShredded)
val repeatedGroupName = if (writeLegacyParquetFormat) {
// Legacy mode:
//
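The new `case _: TimeType` writer above is the mirror image of the read-side conversion: TIME values leave Spark as nanoseconds-of-day and are scaled down to microseconds before `recordConsumer.addLong`, matching the `TIME(MICROS)` physical type. A standalone sketch of that down-conversion, with a helper name that echoes, but is not, `DateTimeUtils.nanosToMicros`:

```scala
// Spark holds TIME values as nanoseconds since midnight in a Long; Parquet's
// TIME(MICROS) column expects microseconds, so the writer divides by 1000.
def nanosToMicrosSketch(nanos: Long): Long = nanos / 1000L

val internalNanos = 3723000004000L                      // 01:02:03.000004
val writtenMicros = nanosToMicrosSketch(internalNanos)  // 3723000004
```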
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/SparkShreddingUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/SparkShreddingUtils.scala
index 24f4fd8274d28..1132f074f29d1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/SparkShreddingUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/parquet/SparkShreddingUtils.scala
@@ -473,13 +473,15 @@ case object SparkShreddingUtils {
* b: struct>>
*
*/
- def variantShreddingSchema(dataType: DataType, isTopLevel: Boolean = true): StructType = {
+ def variantShreddingSchema(dataType: DataType,
+ isTopLevel: Boolean = true,
+ isObjectField: Boolean = false): StructType = {
val fields = dataType match {
case ArrayType(elementType, _) =>
// Always set containsNull to false. One of value or typed_value must always be set for
// array elements.
val arrayShreddingSchema =
- ArrayType(variantShreddingSchema(elementType, false), containsNull = false)
+ ArrayType(variantShreddingSchema(elementType, false, false), containsNull = false)
Seq(
StructField(VariantValueFieldName, BinaryType, nullable = true),
StructField(TypedValueFieldName, arrayShreddingSchema, nullable = true)
@@ -489,15 +491,17 @@ case object SparkShreddingUtils {
// "value" columna as "00", and missing values are represented by setting both "value" and
// "typed_value" to null.
val objectShreddingSchema = StructType(fields.map(f =>
- f.copy(dataType = variantShreddingSchema(f.dataType, false), nullable = false)))
+ f.copy(dataType = variantShreddingSchema(f.dataType, false, true), nullable = false)))
Seq(
StructField(VariantValueFieldName, BinaryType, nullable = true),
StructField(TypedValueFieldName, objectShreddingSchema, nullable = true)
)
case VariantType =>
- // For Variant, we don't need a typed column
+ // For Variant, we don't need a typed column. If there is no typed column, value is required
+ // for array elements or top-level fields, but optional for objects (where a null represents
+ // a missing field).
Seq(
- StructField(VariantValueFieldName, BinaryType, nullable = true)
+ StructField(VariantValueFieldName, BinaryType, nullable = isObjectField)
)
case _: NumericType | BooleanType | _: StringType | BinaryType | _: DatetimeType =>
Seq(
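The `isObjectField` flag added above changes only the nullability of the bare `value` column in the untyped Variant case: required for top-level fields and array elements, nullable for object fields, where `value = null` together with a null `typed_value` marks a missing field. A small sketch of the two resulting leaf shapes; the `"value"` literal stands in for `VariantValueFieldName`:

```scala
import org.apache.spark.sql.types.{BinaryType, StructField, StructType}

// Untyped Variant leaf nested in an object: a missing field is encoded as value = null.
val objectFieldLeaf = StructType(Seq(
  StructField("value", BinaryType, nullable = true)))

// Untyped Variant leaf at top level or as an array element: value must always be present.
val topLevelOrArrayLeaf = StructType(Seq(
  StructField("value", BinaryType, nullable = false)))
```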
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/rules.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/rules.scala
index cf7bad0ecfe60..c8cb5d7ce7c51 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/rules.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/rules.scala
@@ -35,7 +35,6 @@ import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.connector.expressions.{FieldReference, RewritableTransform}
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.command.DDLUtils
-import org.apache.spark.sql.execution.command.ViewHelper.generateViewProperties
import org.apache.spark.sql.execution.datasources.{CreateTable => CreateTableV1}
import org.apache.spark.sql.execution.datasources.v2.FileDataSourceV2
import org.apache.spark.sql.internal.SQLConf
@@ -705,16 +704,6 @@ object ViewSyncSchemaToMetaStore extends (LogicalPlan => Unit) {
}
if (redo) {
- val newProperties = if (viewSchemaMode == SchemaEvolution) {
- generateViewProperties(
- metaData.properties,
- session,
- fieldNames,
- fieldNames,
- metaData.viewSchemaMode)
- } else {
- metaData.properties
- }
val newSchema = if (viewSchemaMode == SchemaTypeEvolution) {
val newFields = viewQuery.schema.map {
case StructField(name, dataType, nullable, _) =>
@@ -727,9 +716,7 @@ object ViewSyncSchemaToMetaStore extends (LogicalPlan => Unit) {
}
SchemaUtils.checkColumnNameDuplication(fieldNames.toImmutableArraySeq,
session.sessionState.conf.resolver)
- val updatedViewMeta = metaData.copy(
- properties = newProperties,
- schema = newSchema)
+ val updatedViewMeta = metaData.copy(schema = newSchema)
session.sessionState.catalog.alterTable(updatedViewMeta)
}
case _ => // OK
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/BatchScanExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/BatchScanExec.scala
index 6a502a44fad58..55866cc858405 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/BatchScanExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/BatchScanExec.scala
@@ -17,18 +17,19 @@
package org.apache.spark.sql.execution.datasources.v2
-import com.google.common.base.Objects
+import java.util.Objects
import org.apache.spark.SparkException
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.plans.QueryPlan
-import org.apache.spark.sql.catalyst.plans.physical.{KeyGroupedPartitioning, KeyGroupedShuffleSpec, Partitioning, SinglePartition}
+import org.apache.spark.sql.catalyst.plans.physical.{KeyGroupedPartitioning, Partitioning, SinglePartition}
import org.apache.spark.sql.catalyst.util.{truncatedString, InternalRowComparableWrapper}
import org.apache.spark.sql.connector.catalog.Table
-import org.apache.spark.sql.connector.catalog.functions.Reducer
import org.apache.spark.sql.connector.read._
+import org.apache.spark.sql.execution.KeyGroupedPartitionedScan
+import org.apache.spark.sql.execution.joins.StoragePartitionJoinParams
import org.apache.spark.util.ArrayImplicits._
/**
@@ -41,7 +42,7 @@ case class BatchScanExec(
ordering: Option[Seq[SortOrder]] = None,
@transient table: Table,
spjParams: StoragePartitionJoinParams = StoragePartitionJoinParams()
- ) extends DataSourceV2ScanExecBase {
+ ) extends DataSourceV2ScanExecBase with KeyGroupedPartitionedScan[InputPartition] {
@transient lazy val batch: Batch = if (scan == null) null else scan.toBatch
@@ -55,7 +56,7 @@ case class BatchScanExec(
false
}
- override def hashCode(): Int = Objects.hashCode(batch, runtimeFilters)
+ override def hashCode(): Int = Objects.hash(batch, runtimeFilters)
@transient override lazy val inputPartitions: Seq[InputPartition] =
batch.planInputPartitions().toImmutableArraySeq
@@ -118,31 +119,7 @@ case class BatchScanExec(
override def outputPartitioning: Partitioning = {
super.outputPartitioning match {
- case k: KeyGroupedPartitioning =>
- val expressions = spjParams.joinKeyPositions match {
- case Some(projectionPositions) => projectionPositions.map(i => k.expressions(i))
- case _ => k.expressions
- }
-
- val newPartValues = spjParams.commonPartitionValues match {
- case Some(commonPartValues) =>
- // We allow duplicated partition values if
- // `spark.sql.sources.v2.bucketing.partiallyClusteredDistribution.enabled` is true
- commonPartValues.flatMap {
- case (partValue, numSplits) => Seq.fill(numSplits)(partValue)
- }
- case None =>
- spjParams.joinKeyPositions match {
- case Some(projectionPositions) => k.partitionValues.map{r =>
- val projectedRow = KeyGroupedPartitioning.project(expressions,
- projectionPositions, r)
- InternalRowComparableWrapper(projectedRow, expressions)
- }.distinct.map(_.row)
- case _ => k.partitionValues
- }
- }
- k.copy(expressions = expressions, numPartitions = newPartValues.length,
- partitionValues = newPartValues)
+ case k: KeyGroupedPartitioning => getOutputKeyGroupedPartitioning(k, spjParams)
case p => p
}
}
@@ -155,104 +132,8 @@ case class BatchScanExec(
sparkContext.parallelize(Array.empty[InternalRow].toImmutableArraySeq, 1)
} else {
val finalPartitions = outputPartitioning match {
- case p: KeyGroupedPartitioning =>
- assert(spjParams.keyGroupedPartitioning.isDefined)
- val expressions = spjParams.keyGroupedPartitioning.get
-
- // Re-group the input partitions if we are projecting on a subset of join keys
- val (groupedPartitions, partExpressions) = spjParams.joinKeyPositions match {
- case Some(projectPositions) =>
- val projectedExpressions = projectPositions.map(i => expressions(i))
- val parts = filteredPartitions.flatten.groupBy(part => {
- val row = part.asInstanceOf[HasPartitionKey].partitionKey()
- val projectedRow = KeyGroupedPartitioning.project(
- expressions, projectPositions, row)
- InternalRowComparableWrapper(projectedRow, projectedExpressions)
- }).map { case (wrapper, splits) => (wrapper.row, splits) }.toSeq
- (parts, projectedExpressions)
- case _ =>
- val groupedParts = filteredPartitions.map(splits => {
- assert(splits.nonEmpty && splits.head.isInstanceOf[HasPartitionKey])
- (splits.head.asInstanceOf[HasPartitionKey].partitionKey(), splits)
- })
- (groupedParts, expressions)
- }
-
- // Also re-group the partitions if we are reducing compatible partition expressions
- val finalGroupedPartitions = spjParams.reducers match {
- case Some(reducers) =>
- val result = groupedPartitions.groupBy { case (row, _) =>
- KeyGroupedShuffleSpec.reducePartitionValue(row, partExpressions, reducers)
- }.map { case (wrapper, splits) => (wrapper.row, splits.flatMap(_._2)) }.toSeq
- val rowOrdering = RowOrdering.createNaturalAscendingOrdering(
- partExpressions.map(_.dataType))
- result.sorted(rowOrdering.on((t: (InternalRow, _)) => t._1))
- case _ => groupedPartitions
- }
-
- // When partially clustered, the input partitions are not grouped by partition
- // values. Here we'll need to check `commonPartitionValues` and decide how to group
- // and replicate splits within a partition.
- if (spjParams.commonPartitionValues.isDefined && spjParams.applyPartialClustering) {
- // A mapping from the common partition values to how many splits the partition
- // should contain.
- val commonPartValuesMap = spjParams.commonPartitionValues
- .get
- .map(t => (InternalRowComparableWrapper(t._1, partExpressions), t._2))
- .toMap
- val filteredGroupedPartitions = finalGroupedPartitions.filter {
- case (partValues, _) =>
- commonPartValuesMap.keySet.contains(
- InternalRowComparableWrapper(partValues, partExpressions))
- }
- val nestGroupedPartitions = filteredGroupedPartitions.map { case (partValue, splits) =>
- // `commonPartValuesMap` should contain the part value since it's the super set.
- val numSplits = commonPartValuesMap
- .get(InternalRowComparableWrapper(partValue, partExpressions))
- assert(numSplits.isDefined, s"Partition value $partValue does not exist in " +
- "common partition values from Spark plan")
-
- val newSplits = if (spjParams.replicatePartitions) {
- // We need to also replicate partitions according to the other side of join
- Seq.fill(numSplits.get)(splits)
- } else {
- // Not grouping by partition values: this could be the side with partially
- // clustered distribution. Because of dynamic filtering, we'll need to check if
- // the final number of splits of a partition is smaller than the original
- // number, and fill with empty splits if so. This is necessary so that both
- // sides of a join will have the same number of partitions & splits.
- splits.map(Seq(_)).padTo(numSplits.get, Seq.empty)
- }
- (InternalRowComparableWrapper(partValue, partExpressions), newSplits)
- }
-
- // Now fill missing partition keys with empty partitions
- val partitionMapping = nestGroupedPartitions.toMap
- spjParams.commonPartitionValues.get.flatMap {
- case (partValue, numSplits) =>
- // Use empty partition for those partition values that are not present.
- partitionMapping.getOrElse(
- InternalRowComparableWrapper(partValue, partExpressions),
- Seq.fill(numSplits)(Seq.empty))
- }
- } else {
- // either `commonPartitionValues` is not defined, or it is defined but
- // `applyPartialClustering` is false.
- val partitionMapping = finalGroupedPartitions.map { case (partValue, splits) =>
- InternalRowComparableWrapper(partValue, partExpressions) -> splits
- }.toMap
-
- // In case `commonPartitionValues` is not defined (e.g., SPJ is not used), there
- // could exist duplicated partition values, as partition grouping is not done
- // at the beginning and postponed to this method. It is important to use unique
- // partition values here so that grouped partitions won't get duplicated.
- p.uniquePartitionValues.map { partValue =>
- // Use empty partition for those partition values that are not present
- partitionMapping.getOrElse(
- InternalRowComparableWrapper(partValue, partExpressions), Seq.empty)
- }
- }
-
+ case p: KeyGroupedPartitioning => getInputPartitionGrouping(
+ p, spjParams, filteredPartitions, p => p.asInstanceOf[HasPartitionKey].partitionKey())
case _ => filteredPartitions
}
@@ -285,28 +166,3 @@ case class BatchScanExec(
s"BatchScan ${table.name()}".trim
}
}
-
-case class StoragePartitionJoinParams(
- keyGroupedPartitioning: Option[Seq[Expression]] = None,
- joinKeyPositions: Option[Seq[Int]] = None,
- commonPartitionValues: Option[Seq[(InternalRow, Int)]] = None,
- reducers: Option[Seq[Option[Reducer[_, _]]]] = None,
- applyPartialClustering: Boolean = false,
- replicatePartitions: Boolean = false) {
- override def equals(other: Any): Boolean = other match {
- case other: StoragePartitionJoinParams =>
- this.commonPartitionValues == other.commonPartitionValues &&
- this.replicatePartitions == other.replicatePartitions &&
- this.applyPartialClustering == other.applyPartialClustering &&
- this.joinKeyPositions == other.joinKeyPositions
- case _ =>
- false
- }
-
- override def hashCode(): Int = Objects.hashCode(
- joinKeyPositions: Option[Seq[Int]],
- commonPartitionValues: Option[Seq[(InternalRow, Int)]],
- applyPartialClustering: java.lang.Boolean,
- replicatePartitions: java.lang.Boolean)
-}
-
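BatchScanExec's `hashCode` now uses the JDK's `java.util.Objects.hash` (varargs, null-safe) instead of Guava's `Objects.hashCode`, trimming a Guava dependency while producing the same combined hash. The call shape in isolation, with parameter names mirroring the fields in the hunk:

```scala
import java.util.Objects

// Combine component hash codes the same way Guava's Objects.hashCode did.
def combinedHash(batch: AnyRef, runtimeFilters: Seq[AnyRef]): Int =
  Objects.hash(batch, runtimeFilters)
```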
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CacheTableExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CacheTableExec.scala
index c7f47d2eaaaad..a28b40dc7cbf5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CacheTableExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CacheTableExec.scala
@@ -19,8 +19,9 @@ package org.apache.spark.sql.execution.datasources.v2
import java.util.Locale
+import scala.util.control.NonFatal
+
import org.apache.spark.internal.LogKeys.OPTIONS
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.{InternalRow, TableIdentifier}
import org.apache.spark.sql.catalyst.analysis.{LocalTempView, UnresolvedRelation}
import org.apache.spark.sql.catalyst.expressions.Attribute
@@ -28,8 +29,10 @@ import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
import org.apache.spark.sql.classic.Dataset
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits.MultipartIdentifierHelper
-import org.apache.spark.sql.execution.command.CreateViewCommand
+import org.apache.spark.sql.connector.catalog.Identifier
+import org.apache.spark.sql.execution.command.{CreateViewCommand, DropTempViewCommand}
import org.apache.spark.storage.StorageLevel
+import org.apache.spark.util.Utils
trait BaseCacheTableExec extends LeafV2CommandExec {
def relationName: String
@@ -53,7 +56,16 @@ trait BaseCacheTableExec extends LeafV2CommandExec {
if (!isLazy) {
// Performs eager caching.
- df.count()
+ try {
+ df.count()
+ } catch {
+ case NonFatal(e) =>
+ // If the query fails, we should remove the cached table.
+ Utils.tryLogNonFatalError {
+ session.sharedState.cacheManager.uncacheQuery(session, planToCache, cascade = false)
+ }
+ throw e
+ }
}
Seq.empty
@@ -99,7 +111,15 @@ case class CacheTableAsSelectExec(
isAnalyzed = true,
referredTempFunctions = referredTempFunctions
).run(session)
- super.run()
+ try {
+ super.run()
+ } catch {
+ case NonFatal(e) =>
+ Utils.tryLogNonFatalError {
+ DropTempViewCommand(Identifier.of(Array.empty, tempViewName)).run(session)
+ }
+ throw e
+ }
}
}
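Both CacheTableExec hunks above follow the same cleanup-on-failure shape: run the eager step, and on a non-fatal error undo the side effect (uncache the plan, or drop the freshly created temp view) before rethrowing the original exception. A generic sketch of that pattern:

```scala
import scala.util.control.NonFatal

// Run `action`; on non-fatal failure, attempt `cleanup` (best effort) and rethrow
// the original exception so callers still see the real cause.
def withCleanupOnFailure[T](action: => T)(cleanup: => Unit): T =
  try {
    action
  } catch {
    case NonFatal(e) =>
      try cleanup catch { case NonFatal(_) => () } // never mask the original error
      throw e
  }
```

In the patch the cleanup branches are additionally wrapped in `Utils.tryLogNonFatalError`, which plays the role of the inner try/catch here.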
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateIndexExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateIndexExec.scala
index 60d44101da3b1..1de97ba4189ea 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateIndexExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateIndexExec.scala
@@ -22,7 +22,6 @@ import java.util
import scala.jdk.CollectionConverters._
import org.apache.spark.internal.LogKeys.{INDEX_NAME, TABLE_NAME}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.IndexAlreadyExistsException
import org.apache.spark.sql.catalyst.expressions.Attribute
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateNamespaceExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateNamespaceExec.scala
index 76ba53ef99a00..ef069fd2fe23b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateNamespaceExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateNamespaceExec.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.execution.datasources.v2
import scala.jdk.CollectionConverters.MapHasAsJava
import org.apache.spark.internal.LogKeys.NAMESPACE
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.NamespaceAlreadyExistsException
import org.apache.spark.sql.catalyst.expressions.Attribute
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateTableExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateTableExec.scala
index 3298a56d95992..58c63be38833f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateTableExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/CreateTableExec.scala
@@ -20,7 +20,6 @@ package org.apache.spark.sql.execution.datasources.v2
import scala.jdk.CollectionConverters._
import org.apache.spark.internal.LogKeys.TABLE_NAME
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.TableAlreadyExistsException
import org.apache.spark.sql.catalyst.expressions.Attribute
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceRDD.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceRDD.scala
index e46c0806ba2d9..6a07d3c3931a1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceRDD.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceRDD.scala
@@ -61,6 +61,14 @@ class DataSourceRDD(
private var currentIter: Option[Iterator[Object]] = None
private var currentIndex: Int = 0
+ private val partitionMetricCallback = new PartitionMetricCallback(customMetrics)
+
+ // In case of early stopping before consuming the entire iterator,
+ // we need to do one more metric update at the end of the task.
+ context.addTaskCompletionListener[Unit] { _ =>
+ partitionMetricCallback.execute()
+ }
+
override def hasNext: Boolean = currentIter.exists(_.hasNext) || advanceToNextIter()
override def next(): Object = {
@@ -87,14 +95,10 @@ class DataSourceRDD(
new PartitionIterator[InternalRow](rowReader, customMetrics))
(iter, rowReader)
}
- context.addTaskCompletionListener[Unit] { _ =>
- // In case of early stopping before consuming the entire iterator,
- // we need to do one more metric update at the end of the task.
- CustomMetrics
- .updateMetrics(reader.currentMetricsValues.toImmutableArraySeq, customMetrics)
- iter.forceUpdateMetrics()
- reader.close()
- }
+
+ // On advancing to the next partition, register the new iterator and reader with the
+ // metric callback; this finalizes the metrics and reader of the previous partition.
+ partitionMetricCallback.advancePartition(iter, reader)
+
currentIter = Some(iter)
hasNext
}
@@ -109,6 +113,28 @@ class DataSourceRDD(
}
}
+private class PartitionMetricCallback
+ (customMetrics: Map[String, SQLMetric]) {
+ private var iter: MetricsIterator[_] = null
+ private var reader: PartitionReader[_] = null
+
+ def advancePartition(iter: MetricsIterator[_], reader: PartitionReader[_]): Unit = {
+ execute()
+
+ this.iter = iter
+ this.reader = reader
+ }
+
+ def execute(): Unit = {
+ if (iter != null && reader != null) {
+ CustomMetrics
+ .updateMetrics(reader.currentMetricsValues.toImmutableArraySeq, customMetrics)
+ iter.forceUpdateMetrics()
+ reader.close()
+ }
+ }
+}
+
private class PartitionIterator[T](
reader: PartitionReader[T],
customMetrics: Map[String, SQLMetric]) extends Iterator[T] {
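The new `PartitionMetricCallback` above registers one task-completion listener up front and finalizes the previous partition's reader each time the scan advances, rather than registering a listener per partition. A simplified sketch of that lifecycle, with a minimal stand-in trait replacing Spark's `MetricsIterator`/`PartitionReader` pair:

```scala
// Stand-in for per-partition resources: something whose metrics can be flushed
// and which must be closed once the scan moves past its partition.
trait PartitionResources {
  def flushMetrics(): Unit
  def close(): Unit
}

class PartitionFinalizer {
  private var current: PartitionResources = null

  // Called when the scan advances: finalize the previous partition, then track the new one.
  def advancePartition(next: PartitionResources): Unit = {
    execute()
    current = next
  }

  // Also invoked once from a task-completion listener, so a task that stops early
  // still flushes and closes the partition it ended in.
  def execute(): Unit = {
    if (current != null) {
      current.flushMetrics()
      current.close()
    }
  }
}
```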
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceV2Strategy.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceV2Strategy.scala
index 9cbea3b69ab79..b07e0442d4f01 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceV2Strategy.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DataSourceV2Strategy.scala
@@ -19,11 +19,10 @@ package org.apache.spark.sql.execution.datasources.v2
import scala.collection.mutable
-import org.apache.commons.lang3.StringUtils
import org.apache.hadoop.fs.Path
import org.apache.spark.SparkException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.EXPR
import org.apache.spark.sql.catalyst.analysis.{ResolvedIdentifier, ResolvedNamespace, ResolvedPartitionSpec, ResolvedTable}
import org.apache.spark.sql.catalyst.catalog.CatalogUtils
@@ -46,12 +45,14 @@ import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors
import org.apache.spark.sql.execution.{FilterExec, InSubqueryExec, LeafExecNode, LocalTableScanExec, ProjectExec, RowDataSourceScanExec, SparkPlan, SparkStrategy => Strategy}
import org.apache.spark.sql.execution.command.CommandUtils
import org.apache.spark.sql.execution.datasources.{DataSourceStrategy, LogicalRelationWithTable, PushableColumnAndNestedColumn}
+import org.apache.spark.sql.execution.joins.StoragePartitionJoinParams
import org.apache.spark.sql.execution.streaming.continuous.{WriteToContinuousDataSource, WriteToContinuousDataSourceExec}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.StaticSQLConf.WAREHOUSE_PATH
import org.apache.spark.sql.sources.{BaseRelation, TableScan}
import org.apache.spark.storage.StorageLevel
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.SparkStringUtils
class DataSourceV2Strategy(session: SparkSession) extends Strategy with PredicateHelper {
@@ -391,7 +392,7 @@ class DataSourceV2Strategy(session: SparkSession) extends Strategy with Predicat
AlterNamespaceSetPropertiesExec(catalog.asNamespaceCatalog, ns, properties) :: Nil
case SetNamespaceLocation(ResolvedNamespace(catalog, ns, _), location) =>
- if (StringUtils.isEmpty(location)) {
+ if (SparkStringUtils.isEmpty(location)) {
throw QueryExecutionErrors.invalidEmptyLocationError(location)
}
AlterNamespaceSetPropertiesExec(
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DescribeTableExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DescribeTableExec.scala
index 7cfd601ef774f..3cc767380d8bb 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DescribeTableExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DescribeTableExec.scala
@@ -45,6 +45,7 @@ case class DescribeTableExec(
addMetadataColumns(rows)
addTableDetails(rows)
addTableStats(rows)
+ addTableConstraints(rows)
}
rows.toSeq
}
@@ -76,15 +77,25 @@ case class DescribeTableExec(
rows += toCatalystRow("Table Properties", properties, "")
// If any columns have default values, append them to the result.
- ResolveDefaultColumns.getDescribeMetadata(table.schema).foreach { row =>
+ ResolveDefaultColumns.getDescribeMetadata(table.columns()).foreach { row =>
rows += toCatalystRow(row._1, row._2, row._3)
}
}
private def addSchema(rows: ArrayBuffer[InternalRow]): Unit = {
- rows ++= table.schema.map{ column =>
+ rows ++= table.columns().map{ column =>
toCatalystRow(
- column.name, column.dataType.simpleString, column.getComment().orNull)
+ column.name, column.dataType.simpleString, column.comment)
+ }
+ }
+
+ private def addTableConstraints(rows: ArrayBuffer[InternalRow]): Unit = {
+ if (table.constraints.nonEmpty) {
+ rows += emptyRow()
+ rows += toCatalystRow("# Constraints", "", "")
+ rows ++= table.constraints().map{ constraint =>
+ toCatalystRow(constraint.name(), constraint.toDescription, "")
+ }
}
}
@@ -107,11 +118,12 @@ case class DescribeTableExec(
rows += toCatalystRow("# Clustering Information", "", "")
rows += toCatalystRow(s"# ${output.head.name}", output(1).name, output(2).name)
rows ++= clusterBySpec.columnNames.map { fieldNames =>
- val nestedField = table.schema.findNestedField(fieldNames.fieldNames.toIndexedSeq)
+ val schema = CatalogV2Util.v2ColumnsToStructType(table.columns())
+ val nestedField = schema.findNestedField(fieldNames.fieldNames.toIndexedSeq)
assert(nestedField.isDefined,
"The clustering column " +
s"${fieldNames.fieldNames.map(quoteIfNeeded).mkString(".")} " +
- s"was not found in the table schema ${table.schema.catalogString}.")
+ s"was not found in the table schema ${schema.catalogString}.")
nestedField.get
}.map { case (path, field) =>
toCatalystRow(
@@ -153,15 +165,15 @@ case class DescribeTableExec(
if (partitionColumnsOnly) {
rows += toCatalystRow("# Partition Information", "", "")
rows += toCatalystRow(s"# ${output(0).name}", output(1).name, output(2).name)
+ val schema = CatalogV2Util.v2ColumnsToStructType(table.columns())
rows ++= table.partitioning
.map(_.asInstanceOf[IdentityTransform].ref.fieldNames())
.map { fieldNames =>
- val nestedField = table.schema.findNestedField(fieldNames.toImmutableArraySeq)
+ val nestedField = schema.findNestedField(fieldNames.toImmutableArraySeq)
if (nestedField.isEmpty) {
throw QueryExecutionErrors.partitionColumnNotFoundInTheTableSchemaError(
fieldNames.toSeq,
- table.schema()
- )
+ schema)
}
nestedField.get
}.map { case (path, field) =>
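DescribeTableExec now derives a `StructType` from the connector's v2 columns (`CatalogV2Util.v2ColumnsToStructType(table.columns())`) before resolving nested clustering and partition column references. A minimal sketch of that lookup; since `StructType.findNestedField` is package-private to `org.apache.spark.sql`, the sketch assumes it lives inside that package, as the original file does:

```scala
package org.apache.spark.sql.execution.datasources.v2

import org.apache.spark.sql.connector.catalog.{CatalogV2Util, Table}
import org.apache.spark.sql.types.{StructField, StructType}

object DescribeSchemaSketch {
  // Build a StructType view of the v2 columns, then resolve a (possibly nested) reference.
  def resolveNestedColumn(
      table: Table,
      fieldNames: Seq[String]): Option[(Seq[String], StructField)] = {
    val schema: StructType = CatalogV2Util.v2ColumnsToStructType(table.columns())
    schema.findNestedField(fieldNames)
  }
}
```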
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DropIndexExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DropIndexExec.scala
index 4fe6c3cd4a0e8..b10f59686062e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DropIndexExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/DropIndexExec.scala
@@ -18,7 +18,6 @@
package org.apache.spark.sql.execution.datasources.v2
import org.apache.spark.internal.LogKeys.INDEX_NAME
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.analysis.NoSuchIndexException
import org.apache.spark.sql.catalyst.expressions.Attribute
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileBatchWrite.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileBatchWrite.scala
index b9f058b55ed02..345a0b0a4a290 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileBatchWrite.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileBatchWrite.scala
@@ -18,7 +18,7 @@ package org.apache.spark.sql.execution.datasources.v2
import org.apache.hadoop.mapreduce.Job
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.io.FileCommitProtocol
import org.apache.spark.sql.connector.write.{BatchWrite, DataWriterFactory, PhysicalWriteInfo, WriterCommitMessage}
import org.apache.spark.sql.execution.datasources.{WriteJobDescription, WriteTaskResult}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FilePartitionReader.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FilePartitionReader.scala
index be4f5dcb65aa1..37060f9bd0816 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FilePartitionReader.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FilePartitionReader.scala
@@ -16,17 +16,17 @@
*/
package org.apache.spark.sql.execution.datasources.v2
-import java.io.{FileNotFoundException, IOException}
+import java.io.FileNotFoundException
import org.apache.hadoop.hdfs.BlockMissingException
import org.apache.hadoop.security.AccessControlException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CURRENT_FILE, PARTITIONED_FILE_READER}
import org.apache.spark.rdd.InputFileBlockHolder
import org.apache.spark.sql.catalyst.FileSourceOptions
import org.apache.spark.sql.connector.read.PartitionReader
-import org.apache.spark.sql.execution.datasources.PartitionedFile
+import org.apache.spark.sql.execution.datasources.{DataSourceUtils, PartitionedFile}
class FilePartitionReader[T](
files: Iterator[PartitionedFile],
@@ -53,7 +53,7 @@ class FilePartitionReader[T](
currentReader = null
case e @ (_ : AccessControlException | _ : BlockMissingException) =>
throw FileDataSourceV2.attachFilePath(file.urlEncodedPath, e)
- case e @ (_: RuntimeException | _: IOException) if ignoreCorruptFiles =>
+ case e if ignoreCorruptFiles && DataSourceUtils.shouldIgnoreCorruptFileException(e) =>
logWarning(
s"Skipped the rest of the content in the corrupted file.", e)
currentReader = null
@@ -71,7 +71,7 @@ class FilePartitionReader[T](
} catch {
case e @ (_ : AccessControlException | _ : BlockMissingException) =>
throw FileDataSourceV2.attachFilePath(currentReader.file.urlEncodedPath, e)
- case e @ (_: RuntimeException | _: IOException) if ignoreCorruptFiles =>
+ case e if ignoreCorruptFiles && DataSourceUtils.shouldIgnoreCorruptFileException(e) =>
logWarning(log"Skipped the rest of the content in the corrupted file: " +
log"${MDC(PARTITIONED_FILE_READER, currentReader)}", e)
false
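FilePartitionReader now delegates the "is this a corrupt-file error?" decision to `DataSourceUtils.shouldIgnoreCorruptFileException` instead of matching `RuntimeException`/`IOException` inline, so every reader classifies such failures the same way. A hedged sketch of that guard pattern; the predicate body below is an assumption that mirrors the match this patch removes, and the real helper may recognize a different set of exception types:

```scala
import java.io.IOException

// Assumed classification, mirroring the inline match removed by this patch.
def shouldIgnoreCorruptFileExceptionSketch(e: Throwable): Boolean = e match {
  case _: RuntimeException | _: IOException => true
  case _ => false
}

// Skip the rest of a corrupt file only when both the flag and the predicate agree;
// anything else propagates to the caller unchanged.
def readOrSkip[T](ignoreCorruptFiles: Boolean)(read: => T): Option[T] =
  try Some(read) catch {
    case e if ignoreCorruptFiles && shouldIgnoreCorruptFileExceptionSketch(e) => None
  }
```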
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileScan.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileScan.scala
index 9ace0540ec243..5348f9ab6df62 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileScan.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileScan.scala
@@ -18,10 +18,9 @@ package org.apache.spark.sql.execution.datasources.v2
import java.util.{Locale, OptionalLong}
-import org.apache.commons.lang3.StringUtils
import org.apache.hadoop.fs.Path
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{PATH, REASON}
import org.apache.spark.internal.config.IO_WARNING_LARGEFILETHRESHOLD
import org.apache.spark.sql.SparkSession
@@ -30,11 +29,11 @@ import org.apache.spark.sql.catalyst.expressions.{AttributeSet, Expression, Expr
import org.apache.spark.sql.catalyst.expressions.codegen.GenerateUnsafeProjection
import org.apache.spark.sql.catalyst.plans.QueryPlan
import org.apache.spark.sql.catalyst.types.DataTypeUtils.toAttributes
-import org.apache.spark.sql.connector.read.{Batch, InputPartition, Scan, Statistics, SupportsReportStatistics}
+import org.apache.spark.sql.connector.read._
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.PartitionedFileUtil
import org.apache.spark.sql.execution.datasources._
-import org.apache.spark.sql.internal.{SessionState, SQLConf}
+import org.apache.spark.sql.internal.{SessionStateHelper, SQLConf}
import org.apache.spark.sql.internal.connector.SupportsMetadata
import org.apache.spark.sql.sources.Filter
import org.apache.spark.sql.types.StructType
@@ -113,10 +112,7 @@ trait FileScan extends Scan
override def hashCode(): Int = getClass.hashCode()
- override def conf: SQLConf = {
- val sessionState: SessionState = sparkSession.sessionState
- sessionState.conf
- }
+ override def conf: SQLConf = SessionStateHelper.getSqlConf(sparkSession)
val maxMetadataValueLength = conf.maxMetadataStringLength
@@ -125,7 +121,7 @@ trait FileScan extends Scan
case (key, value) =>
val redactedValue =
Utils.redact(conf.stringRedactionPattern, value)
- key + ": " + StringUtils.abbreviate(redactedValue, maxMetadataValueLength)
+ key + ": " + Utils.abbreviate(redactedValue, maxMetadataValueLength)
}.mkString(", ")
s"${this.getClass.getSimpleName} $metadataStr"
}
@@ -177,7 +173,7 @@ trait FileScan extends Scan
if (splitFiles.length == 1) {
val path = splitFiles(0).toPath
if (!isSplitable(path) && splitFiles(0).length >
- sparkSession.sparkContext.conf.get(IO_WARNING_LARGEFILETHRESHOLD)) {
+ SessionStateHelper.getSparkConf(sparkSession).get(IO_WARNING_LARGEFILETHRESHOLD)) {
logWarning(log"Loading one large unsplittable file ${MDC(PATH, path.toString)} with only " +
log"one partition, the reason is: ${MDC(REASON, getFileUnSplittableReason(path))}")
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileTable.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileTable.scala
index 863104da80c2e..0af728c1958d4 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileTable.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/FileTable.scala
@@ -29,7 +29,8 @@ import org.apache.spark.sql.connector.expressions.Transform
import org.apache.spark.sql.connector.write.{LogicalWriteInfo, LogicalWriteInfoImpl}
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.datasources._
-import org.apache.spark.sql.execution.streaming.{FileStreamSink, MetadataLogFileIndex}
+import org.apache.spark.sql.execution.streaming.runtime.MetadataLogFileIndex
+import org.apache.spark.sql.execution.streaming.sinks.FileStreamSink
import org.apache.spark.sql.types.{DataType, StructType}
import org.apache.spark.sql.util.CaseInsensitiveStringMap
import org.apache.spark.sql.util.SchemaUtils
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/GroupBasedRowLevelOperationScanPlanning.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/GroupBasedRowLevelOperationScanPlanning.scala
index 8b8cdc06d398b..77e21bcbbdb8f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/GroupBasedRowLevelOperationScanPlanning.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/GroupBasedRowLevelOperationScanPlanning.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.execution.datasources.v2
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.catalyst.expressions.{And, AttributeReference, AttributeSet, Expression, ExpressionSet, PredicateHelper, SubqueryExpression}
import org.apache.spark.sql.catalyst.expressions.Literal.TrueLiteral
import org.apache.spark.sql.catalyst.planning.{GroupBasedRowLevelOperation, PhysicalOperation}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/MergeRowsExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/MergeRowsExec.scala
index 8a25170fcee80..311bab084bbf7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/MergeRowsExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/MergeRowsExec.scala
@@ -29,11 +29,12 @@ import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.expressions.Projection
import org.apache.spark.sql.catalyst.expressions.UnsafeProjection
import org.apache.spark.sql.catalyst.expressions.codegen.GeneratePredicate
-import org.apache.spark.sql.catalyst.plans.logical.MergeRows.{Discard, Instruction, Keep, ROW_ID, Split}
+import org.apache.spark.sql.catalyst.plans.logical.MergeRows.{Context, Copy, Delete, Discard, Insert, Instruction, Keep, ROW_ID, Split, Update}
import org.apache.spark.sql.catalyst.util.truncatedString
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.SparkPlan
import org.apache.spark.sql.execution.UnaryExecNode
+import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
case class MergeRowsExec(
isSourceRowPresent: Expression,
@@ -45,6 +46,24 @@ case class MergeRowsExec(
output: Seq[Attribute],
child: SparkPlan) extends UnaryExecNode {
+ override lazy val metrics: Map[String, SQLMetric] = Map(
+ "numTargetRowsCopied" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows copied unmodified because they did not match any action"),
+ "numTargetRowsInserted" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows inserted"),
+ "numTargetRowsDeleted" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows deleted"),
+ "numTargetRowsUpdated" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows updated"),
+ "numTargetRowsMatchedUpdated" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows updated by a matched clause"),
+ "numTargetRowsMatchedDeleted" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows deleted by a matched clause"),
+ "numTargetRowsNotMatchedBySourceUpdated" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows updated by a not matched by source clause"),
+ "numTargetRowsNotMatchedBySourceDeleted" -> SQLMetrics.createMetric(sparkContext,
+ "number of target rows deleted by a not matched by source clause"))
+
@transient override lazy val producedAttributes: AttributeSet = {
AttributeSet(output.filterNot(attr => inputSet.contains(attr)))
}
@@ -107,8 +126,8 @@ case class MergeRowsExec(
private def planInstructions(instructions: Seq[Instruction]): Seq[InstructionExec] = {
instructions.map {
- case Keep(cond, output) =>
- KeepExec(createPredicate(cond), createProjection(output))
+ case Keep(context, cond, output) =>
+ KeepExec(context, createPredicate(cond), createProjection(output))
case Discard(cond) =>
DiscardExec(createPredicate(cond))
@@ -127,7 +146,10 @@ case class MergeRowsExec(
def condition: BasePredicate
}
- case class KeepExec(condition: BasePredicate, projection: Projection) extends InstructionExec {
+ case class KeepExec(
+ context: Context,
+ condition: BasePredicate,
+ projection: Projection) extends InstructionExec {
def apply(row: InternalRow): InternalRow = projection.apply(row)
}
@@ -203,9 +225,9 @@ case class MergeRowsExec(
if (isTargetRowPresent && isSourceRowPresent) {
cardinalityValidator.validate(row)
- applyInstructions(row, matchedInstructions)
+ applyInstructions(row, matchedInstructions, sourcePresent = true)
} else if (isSourceRowPresent) {
- applyInstructions(row, notMatchedInstructions)
+ applyInstructions(row, notMatchedInstructions, sourcePresent = true)
} else if (isTargetRowPresent) {
applyInstructions(row, notMatchedBySourceInstructions)
} else {
@@ -215,18 +237,29 @@ case class MergeRowsExec(
private def applyInstructions(
row: InternalRow,
- instructions: Seq[InstructionExec]): InternalRow = {
+ instructions: Seq[InstructionExec],
+ sourcePresent: Boolean = false): InternalRow = {
for (instruction <- instructions) {
if (instruction.condition.eval(row)) {
instruction match {
case keep: KeepExec =>
+ keep.context match {
+ case Copy => incrementCopyMetric()
+ case Update => incrementUpdateMetric(sourcePresent)
+ case Insert => incrementInsertMetric()
+ case Delete => incrementDeleteMetric(sourcePresent)
+ case _ => throw new IllegalArgumentException(
+ s"Unexpected context for KeepExec: ${keep.context}")
+ }
return keep.apply(row)
case _: DiscardExec =>
+ incrementDeleteMetric(sourcePresent)
return null
case split: SplitExec =>
+ incrementUpdateMetric(sourcePresent)
cachedExtraRow = split.projectExtraRow(row)
return split.projectRow(row)
}
@@ -236,4 +269,27 @@ case class MergeRowsExec(
null
}
}
+
+ // For group-based MERGE, a row is copied unchanged when it matches no other clause.
+ private def incrementCopyMetric(): Unit = longMetric("numTargetRowsCopied") += 1
+
+ private def incrementInsertMetric(): Unit = longMetric("numTargetRowsInserted") += 1
+
+ private def incrementDeleteMetric(sourcePresent: Boolean): Unit = {
+ longMetric("numTargetRowsDeleted") += 1
+ if (sourcePresent) {
+ longMetric("numTargetRowsMatchedDeleted") += 1
+ } else {
+ longMetric("numTargetRowsNotMatchedBySourceDeleted") += 1
+ }
+ }
+
+ private def incrementUpdateMetric(sourcePresent: Boolean): Unit = {
+ longMetric("numTargetRowsUpdated") += 1
+ if (sourcePresent) {
+ longMetric("numTargetRowsMatchedUpdated") += 1
+ } else {
+ longMetric("numTargetRowsNotMatchedBySourceUpdated") += 1
+ }
+ }
}
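
A minimal sketch of the per-clause metric bookkeeping added to MergeRowsExec above, using a plain mutable map in place of SQLMetric; it only illustrates which counters an update or delete bumps depending on whether the source row is present, not Spark's metric plumbing:

object MergeMetricsSketch {
  import scala.collection.mutable

  private val metrics = mutable.Map.empty[String, Long].withDefaultValue(0L)
  private def inc(name: String): Unit = metrics(name) += 1

  def incrementDeleteMetric(sourcePresent: Boolean): Unit = {
    inc("numTargetRowsDeleted")
    if (sourcePresent) inc("numTargetRowsMatchedDeleted")
    else inc("numTargetRowsNotMatchedBySourceDeleted")
  }

  def incrementUpdateMetric(sourcePresent: Boolean): Unit = {
    inc("numTargetRowsUpdated")
    if (sourcePresent) inc("numTargetRowsMatchedUpdated")
    else inc("numTargetRowsNotMatchedBySourceUpdated")
  }

  def main(args: Array[String]): Unit = {
    incrementUpdateMetric(sourcePresent = true)   // a MATCHED ... UPDATE instruction
    incrementDeleteMetric(sourcePresent = false)  // a NOT MATCHED BY SOURCE ... DELETE instruction
    metrics.toSeq.sorted.foreach { case (k, v) => println(s"$k -> $v") }
  }
}
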
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/PushedDownOperators.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/PushedDownOperators.scala
index 49044c6e24db6..c7d2c56b89858 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/PushedDownOperators.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/PushedDownOperators.scala
@@ -30,6 +30,9 @@ case class PushedDownOperators(
limit: Option[Int],
offset: Option[Int],
sortValues: Seq[SortOrder],
- pushedPredicates: Seq[Predicate]) {
+ pushedPredicates: Seq[Predicate],
+ joinedRelationPushedDownOperators: Seq[PushedDownOperators],
+ // Relation name for a leaf relation. For join nodes, this is empty.
+ relationName: Option[String]) {
assert((limit.isEmpty && sortValues.isEmpty) || limit.isDefined)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowCreateTableExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowCreateTableExec.scala
index 4195560c5cc1c..56e786d3e9334 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowCreateTableExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowCreateTableExec.scala
@@ -65,7 +65,8 @@ case class ShowCreateTableExec(
private def showTableDataColumns(table: Table, builder: StringBuilder): Unit = {
import org.apache.spark.sql.connector.catalog.CatalogV2Implicits._
val columns = CharVarcharUtils.getRawSchema(table.columns.asSchema, conf).fields.map(_.toDDL)
- builder ++= concatByMultiLines(columns)
+ val constraints = table.constraints().map(_.toDDL)
+ builder ++= concatByMultiLines(columns ++ constraints)
}
private def showTableUsing(table: Table, builder: StringBuilder): Unit = {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowTablesExtendedExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowTablesExtendedExec.scala
index 0b2d11a597d5c..ed62890c87d89 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowTablesExtendedExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/ShowTablesExtendedExec.scala
@@ -114,8 +114,8 @@ case class ShowTablesExtendedExec(
field => quoteIdentifier(field.name)).mkString("[", ", ", "]"))
}
- if (table.schema().nonEmpty) {
- results.put("Schema", table.schema().treeString)
+ if (table.columns().nonEmpty) {
+ results.put("Schema", CatalogV2Util.v2ColumnsToStructType(table.columns()).treeString)
}
results.map { case (key, value) =>
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/TableCapabilityCheck.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/TableCapabilityCheck.scala
index e332c6b8014a6..072dcc995f41c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/TableCapabilityCheck.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/TableCapabilityCheck.scala
@@ -23,7 +23,7 @@ import org.apache.spark.sql.catalyst.streaming.StreamingRelationV2
import org.apache.spark.sql.connector.catalog.Table
import org.apache.spark.sql.connector.catalog.TableCapability._
import org.apache.spark.sql.errors.QueryCompilationErrors
-import org.apache.spark.sql.execution.streaming.StreamingRelation
+import org.apache.spark.sql.execution.streaming.runtime.StreamingRelation
import org.apache.spark.sql.types.BooleanType
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanPartitioningAndOrdering.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanPartitioningAndOrdering.scala
index 7ee4374b45789..5d06c8786d894 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanPartitioningAndOrdering.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanPartitioningAndOrdering.scala
@@ -16,7 +16,7 @@
*/
package org.apache.spark.sql.execution.datasources.v2
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.CLASS_NAME
import org.apache.spark.sql.catalyst.expressions.V2ExpressionUtils
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanRelationPushDown.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanRelationPushDown.scala
index 5f7e86cab5240..31a98e1ff96cb 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanRelationPushDown.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2ScanRelationPushDown.scala
@@ -17,21 +17,22 @@
package org.apache.spark.sql.execution.datasources.v2
+import java.util.Locale
+
import scala.collection.mutable
-import org.apache.spark.internal.LogKeys.{AGGREGATE_FUNCTIONS, GROUP_BY_EXPRS, POST_SCAN_FILTERS, PUSHED_FILTERS, RELATION_NAME, RELATION_OUTPUT}
-import org.apache.spark.internal.MDC
+import org.apache.spark.internal.LogKeys.{AGGREGATE_FUNCTIONS, COLUMN_NAMES, GROUP_BY_EXPRS, JOIN_CONDITION, JOIN_TYPE, POST_SCAN_FILTERS, PUSHED_FILTERS, RELATION_NAME, RELATION_OUTPUT}
import org.apache.spark.sql.catalyst.expressions.{aggregate, Alias, And, Attribute, AttributeMap, AttributeReference, AttributeSet, Cast, Expression, IntegerLiteral, Literal, NamedExpression, PredicateHelper, ProjectionOverSchema, SortOrder, SubqueryExpression}
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
import org.apache.spark.sql.catalyst.optimizer.CollapseProject
import org.apache.spark.sql.catalyst.planning.{PhysicalOperation, ScanOperation}
-import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, LeafNode, Limit, LimitAndOffset, LocalLimit, LogicalPlan, Offset, OffsetAndLimit, Project, Sample, Sort}
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, Filter, Join, LeafNode, Limit, LimitAndOffset, LocalLimit, LogicalPlan, Offset, OffsetAndLimit, Project, Sample, Sort}
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.types.DataTypeUtils.toAttributes
import org.apache.spark.sql.connector.expressions.{SortOrder => V2SortOrder}
import org.apache.spark.sql.connector.expressions.aggregate.{Aggregation, Avg, Count, CountStar, Max, Min, Sum}
import org.apache.spark.sql.connector.expressions.filter.Predicate
-import org.apache.spark.sql.connector.read.{Scan, ScanBuilder, SupportsPushDownAggregates, SupportsPushDownFilters, V1Scan}
+import org.apache.spark.sql.connector.read.{Scan, ScanBuilder, SupportsPushDownAggregates, SupportsPushDownFilters, SupportsPushDownJoin, V1Scan}
import org.apache.spark.sql.execution.datasources.DataSourceStrategy
import org.apache.spark.sql.sources
import org.apache.spark.sql.types.{DataType, DecimalType, IntegerType, StructType}
@@ -46,9 +47,11 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
createScanBuilder,
pushDownSample,
pushDownFilters,
+ pushDownJoin,
pushDownAggregates,
pushDownLimitAndOffset,
buildScanWithPushedAggregate,
+ buildScanWithPushedJoin,
pruneColumns)
pushdownRules.foldLeft(plan) { (newPlan, pushDownRule) =>
@@ -98,6 +101,218 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
filterCondition.map(Filter(_, sHolder)).getOrElse(sHolder)
}
+ def pushDownJoin(plan: LogicalPlan): LogicalPlan = plan.transformUp {
+ // A join can be pushed down only if its left and right sides are compatible (for example,
+ // they come from the same data source). Another requirement is that any projections between
+ // the Join and the ScanBuilderHolder must be AttributeReferences. We could probably support
+ // Alias as well, but that is left as a TODO.
+ // Aliases can appear between the Join and the sHolder node because the query below is not
+ // valid:
+ // SELECT * FROM
+ // (SELECT * FROM tbl t1 JOIN tbl2 t2) p
+ // JOIN
+ // (SELECT * FROM tbl t3 JOIN tbl3 t4) q
+ // ON p.t1.col = q.t3.col (this is not possible)
+ // This is because both sides of the top-level join contain duplicated columns and it is not
+ // possible to fully qualify the column names in the condition. Therefore, the query should be
+ // rewritten so that each output of the child joins is aliased, which leaves a projection with
+ // aliases between the top-level join and the ScanBuilderHolder (that has the pushed child
+ // joins).
+ case node @ Join(
+ PhysicalOperation(
+ leftProjections,
+ Nil,
+ leftHolder @ ScanBuilderHolder(_, _, lBuilder: SupportsPushDownJoin)
+ ),
+ PhysicalOperation(
+ rightProjections,
+ Nil,
+ rightHolder @ ScanBuilderHolder(_, _, rBuilder: SupportsPushDownJoin)
+ ),
+ joinType,
+ condition,
+ _) if conf.dataSourceV2JoinPushdown &&
+ // We do not support pushing down anything besides AttributeReference.
+ leftProjections.forall(_.isInstanceOf[AttributeReference]) &&
+ rightProjections.forall(_.isInstanceOf[AttributeReference]) &&
+ // Cross joins are not supported because they increase the amount of data.
+ condition.isDefined &&
+ lBuilder.isOtherSideCompatibleForJoin(rBuilder) =>
+ // Process left and right columns in original order
+ val (leftSideRequiredColumnsWithAliases, rightSideRequiredColumnsWithAliases) =
+ generateColumnAliasesForDuplicatedName(
+ getRequiredColumnNames(leftProjections, leftHolder),
+ getRequiredColumnNames(rightProjections, rightHolder))
+
+ // Create the AttributeMap that holds the (Attribute -> Attribute with an up-to-date name) mapping.
+ val pushedJoinOutputMap = AttributeMap[Expression](
+ node.output
+ .zip(leftSideRequiredColumnsWithAliases ++ rightSideRequiredColumnsWithAliases)
+ .collect {
+ case (attr, columnWithAlias) =>
+ if (columnWithAlias.alias() != null) {
+ (attr, attr.withName(columnWithAlias.alias()))
+ } else {
+ (attr, attr.withName(columnWithAlias.colName()))
+ }
+ }
+ .toMap
+ )
+
+ // Reuse the previously calculated map to update the condition with attributes
+ // with up-to-date names
+ val normalizedCondition = condition.map { e =>
+ DataSourceStrategy.normalizeExprs(
+ Seq(e),
+ (leftHolder.output ++ rightHolder.output).map { a =>
+ pushedJoinOutputMap.getOrElse(a, a).asInstanceOf[AttributeReference]
+ }
+ ).head
+ }
+
+ val translatedCondition =
+ normalizedCondition.flatMap(DataSourceV2Strategy.translateFilterV2(_))
+ val translatedJoinType = DataSourceStrategy.translateJoinType(joinType)
+
+ logInfo(log"DSv2 Join pushdown - translated join condition " +
+ log"${MDC(JOIN_CONDITION, translatedCondition)}")
+ logInfo(log"DSv2 Join pushdown - translated join type " +
+ log"${MDC(JOIN_TYPE, translatedJoinType)}")
+
+ logInfo(log"DSv2 Join pushdown - left side required columns with aliases: " +
+ log"${MDC(
+ COLUMN_NAMES,
+ leftSideRequiredColumnsWithAliases.map(_.prettyString()).mkString(", ")
+ )}")
+ logInfo(log"DSv2 Join pushdown - right side required columns with aliases: " +
+ log"${MDC(
+ COLUMN_NAMES,
+ rightSideRequiredColumnsWithAliases.map(_.prettyString()).mkString(", ")
+ )}")
+
+ if (translatedJoinType.isDefined &&
+ translatedCondition.isDefined &&
+ lBuilder.pushDownJoin(
+ rBuilder,
+ translatedJoinType.get,
+ leftSideRequiredColumnsWithAliases,
+ rightSideRequiredColumnsWithAliases,
+ translatedCondition.get)
+ ) {
+ val leftSidePushedDownOperators = getPushedDownOperators(leftHolder)
+ val rightSidePushedDownOperators = getPushedDownOperators(rightHolder)
+
+ leftHolder.joinedRelations = leftHolder.joinedRelations ++ rightHolder.joinedRelations
+ leftHolder.joinedRelationsPushedDownOperators =
+ Seq(leftSidePushedDownOperators, rightSidePushedDownOperators)
+
+ leftHolder.pushedPredicates = Seq(translatedCondition.get)
+ leftHolder.pushedSample = None
+
+ leftHolder.output = node.output.asInstanceOf[Seq[AttributeReference]]
+ leftHolder.pushedJoinOutputMap = pushedJoinOutputMap
+
+ // TODO: for cascading joins, already-joined relations will still carry the name of the
+ // original (leaf) relation. We should consider whether to rename the relation when the
+ // join is pushed down.
+ logInfo(log"DSv2 Join pushdown - successfully pushed down join between relations " +
+ log"${MDC(RELATION_NAME, leftHolder.relation.name)} and " +
+ log"${MDC(RELATION_NAME, rightHolder.relation.name)}.")
+
+ leftHolder
+ } else {
+ logInfo(log"DSv2 Join pushdown - failed to push down join.")
+ node
+ }
+ }
+ /**
+ * Generates unique column aliases for join operations to avoid naming conflicts.
+ * Handles case sensitivity issues across different databases (SQL Server, MySQL, etc.).
+ *
+ * @param leftSideRequiredColumnNames Columns from the left side of the join
+ * @param rightSideRequiredColumnNames Columns from the right side of the join
+ * @return Tuple of (leftColumnsWithAliases, rightColumnsWithAliases)
+ */
+ private[v2] def generateColumnAliasesForDuplicatedName(
+ leftSideRequiredColumnNames: Array[String],
+ rightSideRequiredColumnNames: Array[String]
+ ): (Array[SupportsPushDownJoin.ColumnWithAlias],
+ Array[SupportsPushDownJoin.ColumnWithAlias]) = {
+ // Normalize all column names to lowercase for case-insensitive comparison
+ val normalizeCase: String => String = _.toLowerCase(Locale.ROOT)
+
+ // Count occurrences of each column name (case-insensitive)
+ val allRequiredColumnNames = leftSideRequiredColumnNames ++ rightSideRequiredColumnNames
+ val allNameCounts: Map[String, Int] =
+ allRequiredColumnNames.map(normalizeCase)
+ .groupBy(identity)
+ .view
+ .mapValues(_.length)
+ .toMap
+
+ // Track claimed aliases using normalized names.
+ // Use a Set for O(1) lookups when checking existing column names, and claim all names
+ // that appear only once so that they keep the highest priority.
+ val allClaimedAliases = mutable.Set.from(
+ allNameCounts.filter(_._2 == 1).keys
+ )
+
+ // Track the suffix index for each base column name (starting at 0) to avoid the extreme
+ // worst case of O(n^2) alias generation.
+ val aliasSuffixIndex = mutable.HashMap[String, Int]().withDefaultValue(0)
+
+ def processColumn(originalName: String): SupportsPushDownJoin.ColumnWithAlias = {
+ val normalizedName = normalizeCase(originalName)
+
+ // No alias needed for unique column names
+ if (allNameCounts(normalizedName) == 1) {
+ new SupportsPushDownJoin.ColumnWithAlias(originalName, null)
+ } else {
+ var attempt = aliasSuffixIndex(normalizedName)
+ var candidate = if (attempt == 0) originalName else s"${originalName}_$attempt"
+ var normalizedCandidate = normalizeCase(candidate)
+
+ // Find the first available unique alias: use the original name on the first attempt,
+ // then append a numeric suffix on subsequent attempts.
+ while (allClaimedAliases.contains(normalizedCandidate)) {
+ attempt += 1
+ candidate = s"${originalName}_$attempt"
+ normalizedCandidate = normalizeCase(candidate)
+ }
+
+ // Update tracking state
+ aliasSuffixIndex(normalizedName) = attempt + 1
+ allClaimedAliases.add(normalizedCandidate)
+
+ if (originalName == candidate) {
+ new SupportsPushDownJoin.ColumnWithAlias(originalName, null)
+ } else {
+ new SupportsPushDownJoin.ColumnWithAlias(originalName, candidate)
+ }
+ }
+ }
+
+ (
+ leftSideRequiredColumnNames.map(processColumn),
+ rightSideRequiredColumnNames.map(processColumn)
+ )
+ }
+
+ // Projection names may be out of date if joins have previously been pushed down.
+ // For this reason, we need to use pushedJoinOutputMap to get up-to-date names.
+ def getRequiredColumnNames(
+ projections: Seq[NamedExpression],
+ sHolder: ScanBuilderHolder): Array[String] = {
+ val normalizedProjections = DataSourceStrategy.normalizeExprs(
+ projections,
+ sHolder.output.map { a =>
+ sHolder.pushedJoinOutputMap.getOrElse(a, a).asInstanceOf[AttributeReference]
+ }
+ ).asInstanceOf[Seq[AttributeReference]]
+
+ normalizedProjections.map(_.name).toArray
+ }
+
def pushDownAggregates(plan: LogicalPlan): LogicalPlan = plan.transform {
// update the scan builder with agg pushdown and return a new plan with agg pushed
case agg: Aggregate => rewriteAggregate(agg)
@@ -113,10 +328,9 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
val aggExprToOutputOrdinal = mutable.HashMap.empty[Expression, Int]
val aggregates = collectAggregates(actualResultExprs, aggExprToOutputOrdinal)
- val normalizedAggExprs = DataSourceStrategy.normalizeExprs(
- aggregates, holder.relation.output).asInstanceOf[Seq[AggregateExpression]]
- val normalizedGroupingExpr = DataSourceStrategy.normalizeExprs(
- actualGroupExprs, holder.relation.output)
+ val normalizedAggExprs =
+ normalizeExpressions(aggregates, holder).asInstanceOf[Seq[AggregateExpression]]
+ val normalizedGroupingExpr = normalizeExpressions(actualGroupExprs, holder)
val translatedAggOpt = DataSourceStrategy.translateAggregation(
normalizedAggExprs, normalizedGroupingExpr)
if (translatedAggOpt.isEmpty) {
@@ -356,6 +570,25 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
Project(projectList, scanRelation)
}
+ def buildScanWithPushedJoin(plan: LogicalPlan): LogicalPlan = plan.transform {
+ case holder: ScanBuilderHolder if holder.joinedRelations.length > 1 =>
+ val scan = holder.builder.build()
+ val realOutput = toAttributes(scan.readSchema())
+ assert(realOutput.length == holder.output.length,
+ "The data source returns unexpected number of columns")
+ val wrappedScan = getWrappedScan(scan, holder)
+ val scanRelation = DataSourceV2ScanRelation(holder.relation, wrappedScan, realOutput)
+
+ // When a join is pushed down, the real output will be, for example,
+ // SALARY_01234#0, NAME_ab123#1, DEPT_cd123#2.
+ // We should revert these names back to the original names, for example
+ // SALARY#0, NAME#1, DEPT#2. This is done by adding a projection with appropriate aliases.
+ val projectList = realOutput.zip(holder.output).map { case (a1, a2) =>
+ Alias(a1, a2.name)(a2.exprId)
+ }
+ Project(projectList, scanRelation)
+ }
+
def pruneColumns(plan: LogicalPlan): LogicalPlan = plan.transform {
case ScanOperation(project, filtersStayUp, filtersPushDown, sHolder: ScanBuilderHolder) =>
// column pruning
@@ -441,8 +674,7 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
} else {
aliasReplacedOrder.asInstanceOf[Seq[SortOrder]]
}
- val normalizedOrders = DataSourceStrategy.normalizeExprs(
- newOrder, sHolder.relation.output).asInstanceOf[Seq[SortOrder]]
+ val normalizedOrders = normalizeExpressions(newOrder, sHolder).asInstanceOf[Seq[SortOrder]]
val orders = DataSourceStrategy.translateSortOrders(normalizedOrders)
if (orders.length == order.length) {
val (isPushed, isPartiallyPushed) =
@@ -540,6 +772,23 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
}
}
+ private def normalizeExpressions(
+ expressions: Seq[Expression],
+ sHolder: ScanBuilderHolder): Seq[Expression] = {
+ val output = if (sHolder.joinedRelations.length == 1) {
+ // Join is not pushed down
+ sHolder.relation.output
+ } else {
+ // sHolder.output's names can be out of date if joins have previously been pushed down.
+ // For this reason, we need to use pushedJoinOutputMap to get up-to-date names.
+ sHolder.output.map { a =>
+ sHolder.pushedJoinOutputMap.getOrElse(a, a).asInstanceOf[AttributeReference]
+ }
+ }
+
+ DataSourceStrategy.normalizeExprs(expressions, output)
+ }
+
private def getWrappedScan(scan: Scan, sHolder: ScanBuilderHolder): Scan = {
scan match {
case v1: V1Scan =>
@@ -548,12 +797,18 @@ object V2ScanRelationPushDown extends Rule[LogicalPlan] with PredicateHelper {
f.pushedFilters()
case _ => Array.empty[sources.Filter]
}
- val pushedDownOperators = PushedDownOperators(sHolder.pushedAggregate, sHolder.pushedSample,
- sHolder.pushedLimit, sHolder.pushedOffset, sHolder.sortOrders, sHolder.pushedPredicates)
+ val pushedDownOperators = getPushedDownOperators(sHolder)
V1ScanWrapper(v1, pushedFilters.toImmutableArraySeq, pushedDownOperators)
case _ => scan
}
}
+
+ private def getPushedDownOperators(sHolder: ScanBuilderHolder): PushedDownOperators = {
+ val optRelationName = Option.when(sHolder.joinedRelations.length <= 1)(sHolder.relation.name)
+ PushedDownOperators(sHolder.pushedAggregate, sHolder.pushedSample,
+ sHolder.pushedLimit, sHolder.pushedOffset, sHolder.sortOrders, sHolder.pushedPredicates,
+ sHolder.joinedRelationsPushedDownOperators, optRelationName)
+ }
}
case class ScanBuilderHolder(
@@ -573,6 +828,12 @@ case class ScanBuilderHolder(
var pushedAggregate: Option[Aggregation] = None
var pushedAggOutputMap: AttributeMap[Expression] = AttributeMap.empty[Expression]
+
+ var joinedRelations: Seq[DataSourceV2RelationBase] = Seq(relation)
+
+ var joinedRelationsPushedDownOperators: Seq[PushedDownOperators] = Seq.empty[PushedDownOperators]
+
+ var pushedJoinOutputMap: AttributeMap[Expression] = AttributeMap.empty[Expression]
}
// A wrapper for v1 scan to carry the translated filters and the handled ones, along with
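
A standalone sketch of the duplicate-name handling in generateColumnAliasesForDuplicatedName above, using (name, Option(alias)) tuples in place of SupportsPushDownJoin.ColumnWithAlias; the suffixing rules mirror the code above, but this is an illustration rather than the authoritative implementation:

object JoinAliasSketch {
  import java.util.Locale
  import scala.collection.mutable

  def aliasDuplicates(left: Array[String], right: Array[String])
      : (Array[(String, Option[String])], Array[(String, Option[String])]) = {
    val norm: String => String = _.toLowerCase(Locale.ROOT)
    // Case-insensitive occurrence counts across both sides.
    val counts = (left ++ right).map(norm).groupBy(identity).view.mapValues(_.length).toMap
    // Unique names claim their alias up front so they never get suffixed.
    val claimed = mutable.Set.from(counts.filter(_._2 == 1).keys)
    val nextSuffix = mutable.HashMap.empty[String, Int].withDefaultValue(0)

    def process(name: String): (String, Option[String]) = {
      val n = norm(name)
      if (counts(n) == 1) (name, None)
      else {
        var attempt = nextSuffix(n)
        var candidate = if (attempt == 0) name else s"${name}_$attempt"
        while (claimed.contains(norm(candidate))) {
          attempt += 1
          candidate = s"${name}_$attempt"
        }
        nextSuffix(n) = attempt + 1
        claimed.add(norm(candidate))
        (name, if (candidate == name) None else Some(candidate))
      }
    }
    (left.map(process), right.map(process))
  }

  def main(args: Array[String]): Unit = {
    val (l, r) = aliasDuplicates(Array("ID", "NAME"), Array("id", "DEPT"))
    println(l.mkString(", "))  // (ID,None), (NAME,None)
    println(r.mkString(", "))  // (id,Some(id_1)), (DEPT,None)
  }
}
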
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2SessionCatalog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2SessionCatalog.scala
index 1088e3f7a7206..891728e6f7e19 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2SessionCatalog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/V2SessionCatalog.scala
@@ -309,7 +309,7 @@ class V2SessionCatalog(catalog: SessionCatalog)
collation = collation, storage = storage))
}
if (changes.exists(_.isInstanceOf[TableChange.ColumnChange])) {
- catalog.alterTableDataSchema(ident.asTableIdentifier, schema)
+ catalog.alterTableSchema(ident.asTableIdentifier, schema)
}
} catch {
case _: NoSuchTableException =>
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/WriteToDataSourceV2Exec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/WriteToDataSourceV2Exec.scala
index 4436c6b24f7c8..68e8c1c6e1047 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/WriteToDataSourceV2Exec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/WriteToDataSourceV2Exec.scala
@@ -17,10 +17,13 @@
package org.apache.spark.sql.execution.datasources.v2
+import java.lang
+import java.util
+
import scala.jdk.CollectionConverters._
import org.apache.spark.{SparkEnv, SparkException, TaskContext}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.{InternalRow, ProjectingInternalRow}
import org.apache.spark.sql.catalyst.analysis.NoSuchTableException
@@ -34,6 +37,7 @@ import org.apache.spark.sql.connector.metric.CustomMetric
import org.apache.spark.sql.connector.write.{BatchWrite, DataWriter, DataWriterFactory, DeltaWrite, DeltaWriter, PhysicalWriteInfoImpl, Write, WriterCommitMessage}
import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
import org.apache.spark.sql.execution.{SparkPlan, SQLExecution, UnaryExecNode}
+import org.apache.spark.sql.execution.adaptive.AdaptiveSparkPlanHelper
import org.apache.spark.sql.execution.metric.{CustomMetrics, SQLMetric, SQLMetrics}
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.{LongAccumulator, Utils}
@@ -303,8 +307,6 @@ case class ReplaceDataExec(
projections: ReplaceDataProjections,
write: Write) extends V2ExistingTableWriteExec {
- override val stringArgs: Iterator[Any] = Iterator(query, write)
-
override def writingTask: WritingSparkTask[_] = {
projections match {
case ReplaceDataProjections(dataProj, Some(metadataProj)) =>
@@ -328,8 +330,6 @@ case class WriteDeltaExec(
projections: WriteDeltaProjections,
write: DeltaWrite) extends V2ExistingTableWriteExec {
- override lazy val stringArgs: Iterator[Any] = Iterator(query, write)
-
override lazy val writingTask: WritingSparkTask[_] = {
if (projections.metadataProjection.isDefined) {
DeltaWithMetadataWritingSparkTask(projections)
@@ -349,6 +349,8 @@ case class WriteToDataSourceV2Exec(
query: SparkPlan,
writeMetrics: Seq[CustomMetric]) extends V2TableWriteExec {
+ override val stringArgs: Iterator[Any] = Iterator(batchWrite, query)
+
override val customMetrics: Map[String, SQLMetric] = writeMetrics.map { customMetric =>
customMetric.name() -> SQLMetrics.createV2CustomMetric(sparkContext, customMetric)
}.toMap
@@ -367,6 +369,8 @@ trait V2ExistingTableWriteExec extends V2TableWriteExec {
def refreshCache: () => Unit
def write: Write
+ override val stringArgs: Iterator[Any] = Iterator(query, write)
+
override val customMetrics: Map[String, SQLMetric] =
write.supportedCustomMetrics().map { customMetric =>
customMetric.name() -> SQLMetrics.createV2CustomMetric(sparkContext, customMetric)
@@ -398,7 +402,7 @@ trait V2ExistingTableWriteExec extends V2TableWriteExec {
/**
* The base physical plan for writing data into data source v2.
*/
-trait V2TableWriteExec extends V2CommandExec with UnaryExecNode {
+trait V2TableWriteExec extends V2CommandExec with UnaryExecNode with AdaptiveSparkPlanHelper {
def query: SparkPlan
def writingTask: WritingSparkTask[_] = DataWritingSparkTask
@@ -451,8 +455,9 @@ trait V2TableWriteExec extends V2CommandExec with UnaryExecNode {
}
)
+ val operationMetrics = getOperationMetrics(query)
logInfo(log"Data source write support ${MDC(LogKeys.BATCH_WRITE, batchWrite)} is committing.")
- batchWrite.commit(messages)
+ batchWrite.commit(messages, operationMetrics)
logInfo(log"Data source write support ${MDC(LogKeys.BATCH_WRITE, batchWrite)} committed.")
commitProgress = Some(StreamWriterCommitProgress(totalNumRowsAccumulator.value))
} catch {
@@ -474,6 +479,12 @@ trait V2TableWriteExec extends V2CommandExec with UnaryExecNode {
Nil
}
+
+ private def getOperationMetrics(query: SparkPlan): util.Map[String, lang.Long] = {
+ collectFirst(query) { case m: MergeRowsExec => m }.map { n =>
+ n.metrics.map { case (name, metric) => s"merge.$name" -> lang.Long.valueOf(metric.value) }
+ }.getOrElse(Map.empty[String, lang.Long]).asJava
+ }
}
trait WritingSparkTask[W <: DataWriter[InternalRow]] extends Logging with Serializable {
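
A minimal sketch of how getOperationMetrics above shapes the metrics handed to BatchWrite.commit: merge metric values are prefixed with "merge." and converted to a java.util.Map. The plan traversal via collectFirst is omitted, and the input map is a stand-in for MergeRowsExec.metrics:

object OperationMetricsSketch {
  import java.{lang, util}
  import scala.jdk.CollectionConverters._

  def toOperationMetrics(mergeMetrics: Map[String, Long]): util.Map[String, lang.Long] =
    mergeMetrics.map { case (name, value) =>
      s"merge.$name" -> lang.Long.valueOf(value)  // prefix so the sink can group them
    }.asJava

  def main(args: Array[String]): Unit = {
    val m = toOperationMetrics(Map("numTargetRowsUpdated" -> 3L, "numTargetRowsDeleted" -> 1L))
    println(m)  // e.g. {merge.numTargetRowsDeleted=1, merge.numTargetRowsUpdated=3} (order unspecified)
  }
}
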
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCScanBuilder.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCScanBuilder.scala
index 230f30fb1d069..b758ddd35e0d2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCScanBuilder.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCScanBuilder.scala
@@ -19,21 +19,25 @@ package org.apache.spark.sql.execution.datasources.v2.jdbc
import scala.util.control.NonFatal
import org.apache.spark.internal.Logging
+import org.apache.spark.internal.LogKeys.{JOIN_CONDITION, JOIN_TYPE, SCHEMA}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.connector.expressions.{FieldReference, SortOrder}
import org.apache.spark.sql.connector.expressions.aggregate.Aggregation
import org.apache.spark.sql.connector.expressions.filter.Predicate
-import org.apache.spark.sql.connector.read.{ScanBuilder, SupportsPushDownAggregates, SupportsPushDownLimit, SupportsPushDownOffset, SupportsPushDownRequiredColumns, SupportsPushDownTableSample, SupportsPushDownTopN, SupportsPushDownV2Filters}
+import org.apache.spark.sql.connector.join.JoinType
+import org.apache.spark.sql.connector.read.{ScanBuilder, SupportsPushDownAggregates, SupportsPushDownJoin, SupportsPushDownLimit, SupportsPushDownOffset, SupportsPushDownRequiredColumns, SupportsPushDownTableSample, SupportsPushDownTopN, SupportsPushDownV2Filters}
import org.apache.spark.sql.execution.datasources.PartitioningUtils
-import org.apache.spark.sql.execution.datasources.jdbc.{JDBCOptions, JDBCRDD, JDBCRelation}
+import org.apache.spark.sql.execution.datasources.jdbc.{JDBCOptions, JDBCPartition, JDBCRDD, JDBCRelation}
import org.apache.spark.sql.execution.datasources.v2.TableSampleInfo
-import org.apache.spark.sql.jdbc.JdbcDialects
+import org.apache.spark.sql.execution.metric.SQLMetric
+import org.apache.spark.sql.jdbc.{JdbcDialects, JdbcSQLQueryBuilder, JoinPushdownAliasGenerator}
import org.apache.spark.sql.types.StructType
case class JDBCScanBuilder(
session: SparkSession,
schema: StructType,
- jdbcOptions: JDBCOptions)
+ var jdbcOptions: JDBCOptions,
+ additionalMetrics: Map[String, SQLMetric] = Map())
extends ScanBuilder
with SupportsPushDownV2Filters
with SupportsPushDownRequiredColumns
@@ -42,6 +46,7 @@ case class JDBCScanBuilder(
with SupportsPushDownOffset
with SupportsPushDownTableSample
with SupportsPushDownTopN
+ with SupportsPushDownJoin
with Logging {
private val dialect = JdbcDialects.get(jdbcOptions.url)
@@ -121,6 +126,151 @@ case class JDBCScanBuilder(
}
}
+ // TODO: currently we check that all the options are the same (besides the dbtable and query
+ // options). That is too strict, so in the future we should relax this check by asserting that
+ // only specific options are the same (e.g. host, port, username, password, database...).
+ // Also, we need to check whether the join is done on 2 tables from 2 different databases
+ // within the same host. This shouldn't be allowed.
+ override def isOtherSideCompatibleForJoin(other: SupportsPushDownJoin): Boolean = {
+ if (!jdbcOptions.pushDownJoin ||
+ !dialect.supportsJoin ||
+ !other.isInstanceOf[JDBCScanBuilder]) {
+ return false
+ }
+
+ val filteredJDBCOptions = jdbcOptions.parameters -
+ JDBCOptions.JDBC_TABLE_NAME -
+ JDBCOptions.JDBC_QUERY_STRING
+
+ val otherSideFilteredJDBCOptions = other.asInstanceOf[JDBCScanBuilder].jdbcOptions.parameters -
+ JDBCOptions.JDBC_TABLE_NAME -
+ JDBCOptions.JDBC_QUERY_STRING
+
+ filteredJDBCOptions == otherSideFilteredJDBCOptions
+ }
+
+ /**
+ * Helper method to calculate StructType based on the SupportsPushDownJoin.ColumnWithAlias and
+ * the given schema.
+ *
+ * If a ColumnWithAlias object has a defined alias, a new field whose name equals the alias
+ * is returned. Otherwise, the original field is returned.
+ */
+ private def calculateJoinOutputSchema(
+ columnsWithAliases: Array[SupportsPushDownJoin.ColumnWithAlias],
+ schema: StructType): StructType = {
+ var newSchema = StructType(Seq())
+ columnsWithAliases.foreach { columnWithAlias =>
+ val colName = columnWithAlias.colName()
+ val alias = columnWithAlias.alias()
+ val field = schema(colName)
+
+ if (alias == null) {
+ newSchema = newSchema.add(field)
+ } else {
+ newSchema = newSchema.add(alias, field.dataType, field.nullable, field.metadata)
+ }
+ }
+
+ newSchema
+ }
+
+ override def pushDownJoin(
+ other: SupportsPushDownJoin,
+ joinType: JoinType,
+ leftSideRequiredColumnsWithAliases: Array[SupportsPushDownJoin.ColumnWithAlias],
+ rightSideRequiredColumnsWithAliases: Array[SupportsPushDownJoin.ColumnWithAlias],
+ condition: Predicate): Boolean = {
+ if (!jdbcOptions.pushDownJoin || !dialect.supportsJoin) {
+ return false
+ }
+
+ val joinTypeStringOption = joinType match {
+ case JoinType.INNER_JOIN => Some("INNER JOIN")
+ case JoinType.LEFT_OUTER_JOIN => Some("LEFT JOIN")
+ case JoinType.RIGHT_OUTER_JOIN => Some("RIGHT JOIN")
+ case _ => None
+ }
+ if (!joinTypeStringOption.isDefined) {
+ logError(log"Failed to push down join to JDBC due to unsupported join type " +
+ log"${MDC(JOIN_TYPE, joinType)}")
+ return false
+ }
+
+ val compiledCondition = dialect.compileExpression(condition)
+ if (!compiledCondition.isDefined) {
+ logError(log"Failed to push down join to JDBC due to unsupported join condition " +
+ log"${MDC(JOIN_CONDITION, condition)}")
+ return false
+ }
+
+ val otherJdbcScanBuilder = other.asInstanceOf[JDBCScanBuilder]
+
+ // requiredSchema will become the finalSchema of this JDBCScanBuilder
+ var requiredSchema = StructType(Seq())
+ requiredSchema = calculateJoinOutputSchema(leftSideRequiredColumnsWithAliases, finalSchema)
+ requiredSchema = requiredSchema.merge(
+ calculateJoinOutputSchema(
+ rightSideRequiredColumnsWithAliases,
+ otherJdbcScanBuilder.finalSchema
+ )
+ )
+
+ val joinOutputColumns = requiredSchema.fields.map(f => dialect.quoteIdentifier(f.name))
+ val conditionString = compiledCondition.get
+
+ // Get the SQL query builders for the left and right sides of the join; they are built
+ // recursively when crafting the join SQL query.
+ val leftSideJdbcSQLBuilder = getJoinPushdownJdbcSQLBuilder(leftSideRequiredColumnsWithAliases)
+ val otherSideJdbcSQLBuilder = otherJdbcScanBuilder
+ .getJoinPushdownJdbcSQLBuilder(rightSideRequiredColumnsWithAliases)
+
+ val joinQuery = dialect
+ .getJdbcSQLQueryBuilder(jdbcOptions)
+ .withJoin(
+ leftSideJdbcSQLBuilder,
+ otherSideJdbcSQLBuilder,
+ JoinPushdownAliasGenerator.getSubqueryQualifier,
+ JoinPushdownAliasGenerator.getSubqueryQualifier,
+ joinOutputColumns,
+ joinTypeStringOption.get,
+ conditionString
+ )
+ .build()
+
+ val newJdbcOptionsMap = jdbcOptions.parameters.originalMap +
+ (JDBCOptions.JDBC_QUERY_STRING -> joinQuery) - JDBCOptions.JDBC_TABLE_NAME
+
+ jdbcOptions = new JDBCOptions(newJdbcOptionsMap)
+ finalSchema = requiredSchema
+ logInfo(log"Updated JDBC schema due to join pushdown. " +
+ log"New schema: ${MDC(SCHEMA, finalSchema.toDDL)}")
+
+ // We need to reset the pushedPredicate because it has already been consumed in the
+ // previously crafted SQL query.
+ pushedPredicate = Array.empty[Predicate]
+ // The table sample has already been pushed down as well, so we reset it to None so that it
+ // is not pushed down again when join pushdown is triggered again on this JDBCScanBuilder.
+
+ true
+ }
+
+ def getJoinPushdownJdbcSQLBuilder(
+ columnsWithAliases: Array[SupportsPushDownJoin.ColumnWithAlias]): JdbcSQLQueryBuilder = {
+ val quotedColumns = columnsWithAliases.map(col => dialect.quoteIdentifier(col.colName()))
+ val quotedAliases = columnsWithAliases
+ .map(col => Option(col.alias()).map(dialect.quoteIdentifier))
+
+ // Only filters can be pushed down before join pushdown, so we need to craft a SQL query
+ // that contains the filters as well.
+ // Joins on top of samples are not supported, so we don't need to provide tableSample here.
+ dialect
+ .getJdbcSQLQueryBuilder(jdbcOptions)
+ .withPredicates(pushedPredicate, JDBCPartition(whereClause = null, idx = 1))
+ .withAliasedColumns(quotedColumns, quotedAliases)
+ }
+
override def pushTableSample(
lowerBound: Double,
upperBound: Double,
@@ -191,7 +341,9 @@ case class JDBCScanBuilder(
// "DEPT","NAME",MAX("SALARY"),MIN("BONUS"), instead of getting column names from
// prunedSchema and quote them (will become "MAX(SALARY)", "MIN(BONUS)" and can't
// be used in sql string.
- JDBCScan(JDBCRelation(schema, parts, jdbcOptions)(session), finalSchema, pushedPredicate,
- pushedAggregateList, pushedGroupBys, tableSample, pushedLimit, sortOrders, pushedOffset)
+ JDBCScan(JDBCRelation(schema, parts, jdbcOptions, additionalMetrics)(session),
+ finalSchema, pushedPredicate, pushedAggregateList, pushedGroupBys,
+ tableSample, pushedLimit, sortOrders, pushedOffset)
}
+
}
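
A minimal sketch of the option comparison behind isOtherSideCompatibleForJoin, operating on plain maps; "dbtable" and "query" stand in for JDBCOptions.JDBC_TABLE_NAME and JDBCOptions.JDBC_QUERY_STRING, and the real check additionally requires pushDownJoin to be enabled, the dialect to support joins, and the other side to be a JDBCScanBuilder:

object JoinCompatibilitySketch {
  // Per-relation keys are excluded: two scans of different tables on the same connection
  // are still considered compatible for join pushdown.
  private val perRelationKeys = Set("dbtable", "query")

  def compatibleForJoin(left: Map[String, String], right: Map[String, String]): Boolean =
    (left -- perRelationKeys) == (right -- perRelationKeys)

  def main(args: Array[String]): Unit = {
    val a = Map("url" -> "jdbc:h2:mem:db", "dbtable" -> "t1", "user" -> "sa")
    val b = Map("url" -> "jdbc:h2:mem:db", "dbtable" -> "t2", "user" -> "sa")
    val c = Map("url" -> "jdbc:h2:mem:other", "dbtable" -> "t3", "user" -> "sa")
    println(compatibleForJoin(a, b))  // true: same connection options, different tables
    println(compatibleForJoin(a, c))  // false: different URLs
  }
}
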
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTable.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTable.scala
index cf9aa4f8682bf..a242a24baf9cd 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTable.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTable.scala
@@ -28,17 +28,30 @@ import org.apache.spark.sql.connector.expressions.NamedReference
import org.apache.spark.sql.connector.write.{LogicalWriteInfo, WriteBuilder}
import org.apache.spark.sql.errors.DataTypeErrorsBase
import org.apache.spark.sql.execution.datasources.jdbc.{JDBCOptions, JdbcOptionsInWrite, JdbcUtils}
+import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.sql.jdbc.JdbcDialects
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.util.CaseInsensitiveStringMap
-case class JDBCTable(ident: Identifier, schema: StructType, jdbcOptions: JDBCOptions)
+case class JDBCTable(
+ ident: Identifier,
+ override val schema: StructType,
+ jdbcOptions: JDBCOptions,
+ additionalMetrics: Map[String, SQLMetric] = Map())
extends Table
with SupportsRead
with SupportsWrite
with SupportsIndex
with DataTypeErrorsBase {
+ override def hashCode(): Int = (ident, schema, jdbcOptions).##
+
+ override def equals(obj: Any): Boolean = obj match {
+ case that: JDBCTable =>
+ this.ident == that.ident && this.schema == that.schema && this.jdbcOptions == that.jdbcOptions
+ case _ => false
+ }
+
override def name(): String = ident.toString
override def capabilities(): util.Set[TableCapability] = {
@@ -48,7 +61,7 @@ case class JDBCTable(ident: Identifier, schema: StructType, jdbcOptions: JDBCOpt
override def newScanBuilder(options: CaseInsensitiveStringMap): JDBCScanBuilder = {
val mergedOptions = new JDBCOptions(
jdbcOptions.parameters.originalMap ++ options.asCaseSensitiveMap().asScala)
- JDBCScanBuilder(SparkSession.active, schema, mergedOptions)
+ JDBCScanBuilder(SparkSession.active, schema, mergedOptions, additionalMetrics)
}
override def newWriteBuilder(info: LogicalWriteInfo): WriteBuilder = {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalog.scala
index 63048028c5877..7f9a408a597d8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/jdbc/JDBCTableCatalog.scala
@@ -16,7 +16,7 @@
*/
package org.apache.spark.sql.execution.datasources.v2.jdbc
-import java.sql.SQLException
+import java.sql.{Connection, SQLException}
import java.util
import scala.collection.mutable
@@ -24,11 +24,13 @@ import scala.jdk.CollectionConverters._
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.analysis.NoSuchFunctionException
+import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.connector.catalog.{CatalogV2Util, Column, FunctionCatalog, Identifier, NamespaceChange, SupportsNamespaces, Table, TableCatalog, TableChange, TableSummary}
import org.apache.spark.sql.connector.catalog.functions.UnboundFunction
import org.apache.spark.sql.connector.expressions.Transform
import org.apache.spark.sql.errors.{DataTypeErrorsBase, QueryCompilationErrors, QueryExecutionErrors}
-import org.apache.spark.sql.execution.datasources.jdbc.{JDBCOptions, JdbcOptionsInWrite, JDBCRDD, JdbcUtils}
+import org.apache.spark.sql.execution.datasources.jdbc.{JDBCOptions, JdbcOptionsInWrite, JDBCRDD, JDBCRelation, JdbcUtils}
+import org.apache.spark.sql.execution.metric.SQLMetrics
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.jdbc.{JdbcDialect, JdbcDialects}
import org.apache.spark.sql.util.CaseInsensitiveStringMap
@@ -91,19 +93,21 @@ class JDBCTableCatalog extends TableCatalog
}
override def tableExists(ident: Identifier): Boolean = {
+ JdbcUtils.withConnection(options)(tableExists(ident, _))
+ }
+
+ private def tableExists(ident: Identifier, conn: Connection): Boolean = {
checkNamespace(ident.namespace())
val writeOptions = new JdbcOptionsInWrite(
options.parameters + (JDBCOptions.JDBC_TABLE_NAME -> getTableName(ident)))
- JdbcUtils.withConnection(options) {
- JdbcUtils.classifyException(
- condition = "FAILED_JDBC.TABLE_EXISTS",
- messageParameters = Map(
- "url" -> options.getRedactUrl(),
- "tableName" -> toSQLId(ident)),
- dialect,
- description = s"Failed table existence check: $ident",
- isRuntime = false)(JdbcUtils.tableExists(_, writeOptions))
- }
+ JdbcUtils.classifyException(
+ condition = "FAILED_JDBC.TABLE_EXISTS",
+ messageParameters = Map(
+ "url" -> options.getRedactUrl(),
+ "tableName" -> toSQLId(ident)),
+ dialect,
+ description = s"Failed table existence check: $ident",
+ isRuntime = false)(JdbcUtils.tableExists(conn, writeOptions))
}
override def dropTable(ident: Identifier): Boolean = {
@@ -136,23 +140,30 @@ class JDBCTableCatalog extends TableCatalog
}
override def loadTable(ident: Identifier): Table = {
- if (!tableExists(ident)) {
- throw QueryCompilationErrors.noSuchTableError(ident)
- }
+ JdbcUtils.withConnection(options) { conn =>
+ if (!tableExists(ident, conn)) {
+ throw QueryCompilationErrors.noSuchTableError(ident)
+ }
- val optionsWithTableName = new JDBCOptions(
- options.parameters + (JDBCOptions.JDBC_TABLE_NAME -> getTableName(ident)))
- JdbcUtils.classifyException(
- condition = "FAILED_JDBC.LOAD_TABLE",
- messageParameters = Map(
- "url" -> options.getRedactUrl(),
- "tableName" -> toSQLId(ident)),
- dialect,
- description = s"Failed to load table: $ident",
- isRuntime = false
- ) {
- val schema = JDBCRDD.resolveTable(optionsWithTableName)
- JDBCTable(ident, schema, optionsWithTableName)
+ val optionsWithTableName = new JDBCOptions(
+ options.parameters + (JDBCOptions.JDBC_TABLE_NAME -> getTableName(ident)))
+ JdbcUtils.classifyException(
+ condition = "FAILED_JDBC.LOAD_TABLE",
+ messageParameters = Map(
+ "url" -> options.getRedactUrl(),
+ "tableName" -> toSQLId(ident)),
+ dialect,
+ description = s"Failed to load table: $ident",
+ isRuntime = false
+ ) {
+ val remoteSchemaFetchMetric = JdbcUtils
+ .createSchemaFetchMetric(SparkSession.active.sparkContext)
+ val schema = SQLMetrics.withTimingNs(remoteSchemaFetchMetric) {
+ JDBCRDD.resolveTable(optionsWithTableName, conn)
+ }
+ JDBCTable(ident, schema, optionsWithTableName,
+ Map(JDBCRelation.schemaFetchKey -> remoteSchemaFetchMetric))
+ }
}
}
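
A standalone sketch of the timing pattern used above for the remote schema fetch, with a plain Long accumulator standing in for the SQLMetric that SQLMetrics.withTimingNs updates in the real code:

object SchemaFetchTimingSketch {
  private var schemaFetchNanos = 0L

  // Measure the elapsed wall-clock time of `body` in nanoseconds and accumulate it.
  def withTimingNs[T](body: => T): T = {
    val start = System.nanoTime()
    try body finally { schemaFetchNanos += System.nanoTime() - start }
  }

  def main(args: Array[String]): Unit = {
    val schema = withTimingNs {
      Thread.sleep(5)          // stand-in for JDBCRDD.resolveTable(options, conn)
      "id INT, name STRING"
    }
    println(s"schema=$schema, fetch took ${schemaFetchNanos / 1000000} ms")
  }
}
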
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/parquet/ParquetPartitionReaderFactory.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/parquet/ParquetPartitionReaderFactory.scala
index ac15456f0c3d4..70ae8068a03a0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/parquet/ParquetPartitionReaderFactory.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/parquet/ParquetPartitionReaderFactory.scala
@@ -84,6 +84,8 @@ case class ParquetPartitionReaderFactory(
private val datetimeRebaseModeInRead = options.datetimeRebaseModeInRead
private val int96RebaseModeInRead = options.int96RebaseModeInRead
+ private val parquetReaderCallback = new ParquetReaderCallback()
+
private def getFooter(file: PartitionedFile): ParquetMetadata = {
val conf = broadcastedConf.value.value
if (aggregation.isDefined || enableVectorizedReader) {
@@ -309,7 +311,8 @@ case class ParquetPartitionReaderFactory(
reader, readDataSchema)
val iter = new RecordReaderIterator(readerWithRowIndexes)
// SPARK-23457 Register a task completion listener before `initialization`.
- taskContext.foreach(_.addTaskCompletionListener[Unit](_ => iter.close()))
+ parquetReaderCallback.advanceFile(iter)
+ taskContext.foreach(parquetReaderCallback.initIfNotAlready)
readerWithRowIndexes
}
@@ -337,8 +340,39 @@ case class ParquetPartitionReaderFactory(
capacity)
val iter = new RecordReaderIterator(vectorizedReader)
// SPARK-23457 Register a task completion listener before `initialization`.
- taskContext.foreach(_.addTaskCompletionListener[Unit](_ => iter.close()))
+ parquetReaderCallback.advanceFile(iter)
+ taskContext.foreach(parquetReaderCallback.initIfNotAlready)
logDebug(s"Appending $partitionSchema $partitionValues")
vectorizedReader
}
}
+
+/**
+ * A callback class to handle the cleanup of Parquet readers.
+ *
+ * This class ensures that Parquet readers are closed properly when the task completes, and
+ * that the task completion listener is registered only once per task.
+ */
+private class ParquetReaderCallback extends Serializable {
+ private var init: Boolean = false
+ private var iter: RecordReaderIterator[_] = null
+
+ def initIfNotAlready(taskContext: TaskContext): Unit = {
+ if (!init) {
+ taskContext.addTaskCompletionListener[Unit](_ => closeCurrent())
+ init = true
+ }
+ }
+
+ def advanceFile(iter: RecordReaderIterator[_]): Unit = {
+ closeCurrent()
+
+ this.iter = iter
+ }
+
+ def closeCurrent(): Unit = {
+ if (iter != null) {
+ iter.close()
+ }
+ }
+}
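
A self-contained sketch of the ParquetReaderCallback lifecycle above: one completion hook is registered per task, and the previous file's iterator is closed whenever the factory advances to the next file. Closeable and the callbacks buffer are stand-ins for RecordReaderIterator and TaskContext.addTaskCompletionListener:

object ReaderCallbackSketch {
  import java.io.Closeable
  import scala.collection.mutable

  // Stand-in for the task completion listener registry on TaskContext.
  private val taskCompletionCallbacks = mutable.Buffer.empty[() => Unit]

  final class Callback {
    private var registered = false
    private var current: Closeable = null

    def initIfNotAlready(): Unit = if (!registered) {
      taskCompletionCallbacks += (() => closeCurrent())
      registered = true
    }

    def advanceFile(next: Closeable): Unit = {
      closeCurrent()      // close the previous file's reader before switching
      current = next
    }

    def closeCurrent(): Unit = if (current != null) current.close()
  }

  def main(args: Array[String]): Unit = {
    val cb = new Callback
    def open(name: String): Closeable = () => println(s"closed $name")
    cb.advanceFile(open("file-0.parquet")); cb.initIfNotAlready()
    cb.advanceFile(open("file-1.parquet"))      // prints "closed file-0.parquet"
    taskCompletionCallbacks.foreach(_.apply())  // task end: prints "closed file-1.parquet"
  }
}
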
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/python/PythonStreamingPartitionReaderFactory.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/python/PythonStreamingPartitionReaderFactory.scala
index 7d80cc2728102..466ecf6090938 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/python/PythonStreamingPartitionReaderFactory.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/python/PythonStreamingPartitionReaderFactory.scala
@@ -19,7 +19,7 @@
package org.apache.spark.sql.execution.datasources.v2.python
import org.apache.spark.SparkEnv
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.connector.metric.CustomTaskMetric
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateDataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateDataSource.scala
index 937eb1fc042d5..828c06ab834ab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateDataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateDataSource.scala
@@ -29,13 +29,18 @@ import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.DataSourceOptions
import org.apache.spark.sql.connector.catalog.{Table, TableProvider}
import org.apache.spark.sql.connector.expressions.Transform
-import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.{JoinSideValues, READ_REGISTERED_TIMERS, STATE_VAR_NAME}
+import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.{JoinSideValues, READ_REGISTERED_TIMERS, STATE_VAR_NAME, STORE_NAME}
import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.JoinSideValues.JoinSideValues
import org.apache.spark.sql.execution.datasources.v2.state.metadata.{StateMetadataPartitionReader, StateMetadataTableEntry}
import org.apache.spark.sql.execution.datasources.v2.state.utils.SchemaUtil
-import org.apache.spark.sql.execution.streaming.{OffsetSeqMetadata, StreamingQueryCheckpointMetadata, TimerStateUtils, TransformWithStateOperatorProperties, TransformWithStateVariableInfo}
-import org.apache.spark.sql.execution.streaming.StreamingCheckpointConstants.DIR_NAME_STATE
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper.{LeftSide, RightSide}
+import org.apache.spark.sql.execution.streaming.checkpointing.OffsetSeqMetadata
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorsUtils
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper.{LeftSide, RightSide}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.SymmetricHashJoinStateManager
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.{TransformWithStateOperatorProperties, TransformWithStateVariableInfo}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.timers.TimerStateUtils
+import org.apache.spark.sql.execution.streaming.runtime.StreamingCheckpointConstants.DIR_NAME_STATE
+import org.apache.spark.sql.execution.streaming.runtime.StreamingQueryCheckpointMetadata
import org.apache.spark.sql.execution.streaming.state.{InMemoryStateSchemaProvider, KeyStateEncoderSpec, NoPrefixKeyStateEncoderSpec, PrefixKeyScanStateEncoderSpec, StateSchemaCompatibilityChecker, StateSchemaMetadata, StateSchemaProvider, StateStore, StateStoreColFamilySchema, StateStoreConf, StateStoreId, StateStoreProviderId}
import org.apache.spark.sql.sources.DataSourceRegister
import org.apache.spark.sql.streaming.TimeMode
@@ -51,25 +56,17 @@ class StateDataSource extends TableProvider with DataSourceRegister with Logging
private lazy val hadoopConf: Configuration = session.sessionState.newHadoopConf()
- private lazy val serializedHadoopConf = new SerializableConfiguration(hadoopConf)
-
- // Seq of operator names who uses state schema v3 and TWS related options.
- // This Seq was used in checks before reading state schema files.
- private val twsShortNameSeq = Seq(
- "transformWithStateExec",
- "transformWithStateInPandasExec",
- "transformWithStateInPySparkExec"
- )
-
override def shortName(): String = "statestore"
override def getTable(
schema: StructType,
partitioning: Array[Transform],
properties: util.Map[String, String]): Table = {
- val sourceOptions = StateSourceOptions.apply(session, hadoopConf, properties)
+ val sourceOptions = StateSourceOptions.modifySourceOptions(hadoopConf,
+ StateSourceOptions.apply(session, hadoopConf, properties))
val stateConf = buildStateStoreConf(sourceOptions.resolvedCpLocation, sourceOptions.batchId)
- val stateStoreReaderInfo: StateStoreReaderInfo = getStoreMetadataAndRunChecks(sourceOptions)
+ val stateStoreReaderInfo: StateStoreReaderInfo = getStoreMetadataAndRunChecks(
+ sourceOptions)
// The key state encoder spec should be available for all operators except stream-stream joins
val keyStateEncoderSpec = if (stateStoreReaderInfo.keyStateEncoderSpecOpt.isDefined) {
@@ -82,25 +79,28 @@ class StateDataSource extends TableProvider with DataSourceRegister with Logging
new StateTable(session, schema, sourceOptions, stateConf, keyStateEncoderSpec,
stateStoreReaderInfo.transformWithStateVariableInfoOpt,
stateStoreReaderInfo.stateStoreColFamilySchemaOpt,
- stateStoreReaderInfo.stateSchemaProviderOpt)
+ stateStoreReaderInfo.stateSchemaProviderOpt,
+ stateStoreReaderInfo.joinColFamilyOpt)
}
override def inferSchema(options: CaseInsensitiveStringMap): StructType = {
- val sourceOptions = StateSourceOptions.apply(session, hadoopConf, options)
+ val sourceOptions = StateSourceOptions.modifySourceOptions(hadoopConf,
+ StateSourceOptions.apply(session, hadoopConf, options))
- val stateStoreReaderInfo: StateStoreReaderInfo = getStoreMetadataAndRunChecks(sourceOptions)
+ val stateStoreReaderInfo: StateStoreReaderInfo = getStoreMetadataAndRunChecks(
+ sourceOptions)
+ val oldSchemaFilePaths = StateDataSource.getOldSchemaFilePaths(sourceOptions, hadoopConf)
val stateCheckpointLocation = sourceOptions.stateCheckpointLocation
try {
- // SPARK-51779 TODO: Support stream-stream joins with virtual column families
val (keySchema, valueSchema) = sourceOptions.joinSide match {
case JoinSideValues.left =>
StreamStreamJoinStateHelper.readKeyValueSchema(session, stateCheckpointLocation.toString,
- sourceOptions.operatorId, LeftSide)
+ sourceOptions.operatorId, LeftSide, oldSchemaFilePaths)
case JoinSideValues.right =>
StreamStreamJoinStateHelper.readKeyValueSchema(session, stateCheckpointLocation.toString,
- sourceOptions.operatorId, RightSide)
+ sourceOptions.operatorId, RightSide, oldSchemaFilePaths)
case JoinSideValues.none =>
// we should have the schema for the state store if joinSide is none
@@ -141,19 +141,7 @@ class StateDataSource extends TableProvider with DataSourceRegister with Logging
private def runStateVarChecks(
sourceOptions: StateSourceOptions,
stateStoreMetadata: Array[StateMetadataTableEntry]): Unit = {
- if (sourceOptions.stateVarName.isDefined || sourceOptions.readRegisteredTimers) {
- // Perform checks for transformWithState operator in case state variable name is provided
- require(stateStoreMetadata.size == 1)
- val opMetadata = stateStoreMetadata.head
- if (!twsShortNameSeq.contains(opMetadata.operatorName)) {
- // if we are trying to query state source with state variable name, then the operator
- // should be transformWithState
- val errorMsg = "Providing state variable names is only supported with the " +
- s"transformWithState operator. Found operator=${opMetadata.operatorName}. " +
- s"Please remove this option and re-run the query."
- throw StateDataSourceErrors.invalidOptionValue(STATE_VAR_NAME, errorMsg)
- }
-
+ def runTWSChecks(opMetadata: StateMetadataTableEntry): Unit = {
// if the operator is transformWithState, but the operator properties are empty, then
// the user has not defined any state variables for the operator
val operatorProperties = opMetadata.operatorPropertiesJson
@@ -183,35 +171,74 @@ class StateDataSource extends TableProvider with DataSourceRegister with Logging
throw StateDataSourceErrors.invalidOptionValue(STATE_VAR_NAME,
s"State variable $stateVarName is not defined for the transformWithState operator.")
}
- } else {
- // if the operator is transformWithState, then a state variable argument is mandatory
- if (stateStoreMetadata.size == 1 &&
- twsShortNameSeq.contains(stateStoreMetadata.head.operatorName)) {
- throw StateDataSourceErrors.requiredOptionUnspecified("stateVarName")
- }
}
- }
- private def getStateStoreMetadata(stateSourceOptions: StateSourceOptions):
- Array[StateMetadataTableEntry] = {
- val allStateStoreMetadata = new StateMetadataPartitionReader(
- stateSourceOptions.stateCheckpointLocation.getParent.toString,
- serializedHadoopConf, stateSourceOptions.batchId).stateMetadata.toArray
- val stateStoreMetadata = allStateStoreMetadata.filter { entry =>
- entry.operatorId == stateSourceOptions.operatorId &&
- entry.stateStoreName == stateSourceOptions.storeName
+ sourceOptions.stateVarName match {
+ case Some(name) =>
+ // Check that exactly one state store metadata entry exists
+ require(stateStoreMetadata.size == 1)
+ val opMetadata = stateStoreMetadata.head
+ opMetadata.operatorName match {
+ case opName: String if opName ==
+ StatefulOperatorsUtils.SYMMETRIC_HASH_JOIN_EXEC_OP_NAME =>
+ // Verify that the store name is valid
+ val possibleStoreNames = SymmetricHashJoinStateManager.allStateStoreNames(
+ LeftSide, RightSide)
+ if (!possibleStoreNames.contains(name)) {
+ val errorMsg = s"Store name $name is not allowed for the join operator. Allowed names are " +
+ s"$possibleStoreNames. " +
+ s"Please remove this option and re-run the query."
+ throw StateDataSourceErrors.invalidOptionValue(STORE_NAME, errorMsg)
+ }
+ case opName: String if StatefulOperatorsUtils.TRANSFORM_WITH_STATE_OP_NAMES
+ .contains(opName) =>
+ runTWSChecks(opMetadata)
+ case _ =>
+ // if we are trying to query state source with state variable name, then the operator
+ // should be transformWithState
+ val errorMsg = "Providing state variable names is only supported with the " +
+ s"transformWithState operator. Found operator=${opMetadata.operatorName}. " +
+ s"Please remove this option and re-run the query."
+ throw StateDataSourceErrors.invalidOptionValue(STATE_VAR_NAME, errorMsg)
+ }
+ case None =>
+ if (sourceOptions.readRegisteredTimers) {
+ // Check that exactly one state store metadata entry exists
+ require(stateStoreMetadata.size == 1)
+ val opMetadata = stateStoreMetadata.head
+ opMetadata.operatorName match {
+ case opName: String if StatefulOperatorsUtils.TRANSFORM_WITH_STATE_OP_NAMES
+ .contains(opName) =>
+ runTWSChecks(opMetadata)
+ case _ =>
+ // if we are trying to query the state source with readRegisteredTimers=true, then
+ // the operator should be transformWithState
+ val errorMsg = "Providing readRegisteredTimers=true is only supported with the " +
+ s"transformWithState operator. Found operator=${opMetadata.operatorName}. " +
+ s"Please remove this option and re-run the query."
+ throw StateDataSourceErrors.invalidOptionValue(READ_REGISTERED_TIMERS, errorMsg)
+ }
+ } else {
+ // if the operator is transformWithState, then a state variable argument is mandatory
+ if (stateStoreMetadata.size == 1 &&
+ StatefulOperatorsUtils.TRANSFORM_WITH_STATE_OP_NAMES.contains(
+ stateStoreMetadata.head.operatorName)) {
+ throw StateDataSourceErrors.requiredOptionUnspecified("stateVarName")
+ }
+ }
}
- stateStoreMetadata
}
private def getStoreMetadataAndRunChecks(sourceOptions: StateSourceOptions):
StateStoreReaderInfo = {
- val storeMetadata = getStateStoreMetadata(sourceOptions)
+ val storeMetadata = StateDataSource.getStateStoreMetadata(sourceOptions, hadoopConf)
runStateVarChecks(sourceOptions, storeMetadata)
+
var keyStateEncoderSpecOpt: Option[KeyStateEncoderSpec] = None
var stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema] = None
var transformWithStateVariableInfoOpt: Option[TransformWithStateVariableInfo] = None
var stateSchemaProvider: Option[StateSchemaProvider] = None
+ var joinColFamilyOpt: Option[String] = None
var timeMode: String = TimeMode.None.toString
if (sourceOptions.joinSide == JoinSideValues.none) {
@@ -220,34 +247,41 @@ class StateDataSource extends TableProvider with DataSourceRegister with Logging
// Read the schema file path from operator metadata version v2 onwards
// for the transformWithState operator
- val oldSchemaFilePaths = if (storeMetadata.length > 0 && storeMetadata.head.version == 2
- && twsShortNameSeq.exists(storeMetadata.head.operatorName.contains)) {
- val storeMetadataEntry = storeMetadata.head
- val operatorProperties = TransformWithStateOperatorProperties.fromJson(
- storeMetadataEntry.operatorPropertiesJson)
- timeMode = operatorProperties.timeMode
-
- if (sourceOptions.readRegisteredTimers) {
- stateVarName = TimerStateUtils.getTimerStateVarNames(timeMode)._1
+ val oldSchemaFilePaths = if (storeMetadata.length > 0 && storeMetadata.head.version == 2) {
+ val opName = storeMetadata.head.operatorName
+ if (StatefulOperatorsUtils.TRANSFORM_WITH_STATE_OP_NAMES.exists(opName.contains)) {
+ val storeMetadataEntry = storeMetadata.head
+ val operatorProperties = TransformWithStateOperatorProperties.fromJson(
+ storeMetadataEntry.operatorPropertiesJson)
+ timeMode = operatorProperties.timeMode
+
+ if (sourceOptions.readRegisteredTimers) {
+ stateVarName = TimerStateUtils.getTimerStateVarNames(timeMode)._1
+ }
+
+ val stateVarInfoList = operatorProperties.stateVariables
+ .filter(stateVar => stateVar.stateName == stateVarName)
+ require(stateVarInfoList.size == 1, s"Failed to find unique state variable info " +
+ s"for state variable $stateVarName in operator ${sourceOptions.operatorId}")
+ val stateVarInfo = stateVarInfoList.head
+ transformWithStateVariableInfoOpt = Some(stateVarInfo)
+ val schemaFilePaths = storeMetadataEntry.stateSchemaFilePaths
+ val stateSchemaMetadata = StateSchemaMetadata.createStateSchemaMetadata(
+ sourceOptions.stateCheckpointLocation.toString,
+ hadoopConf,
+ schemaFilePaths
+ )
+ stateSchemaProvider = Some(new InMemoryStateSchemaProvider(stateSchemaMetadata))
+ schemaFilePaths.map(new Path(_))
+ } else {
+ if (opName == StatefulOperatorsUtils.SYMMETRIC_HASH_JOIN_EXEC_OP_NAME) {
+ joinColFamilyOpt = Some(stateVarName)
+ }
+ StateDataSource.getOldSchemaFilePaths(sourceOptions, hadoopConf)
}
-
- val stateVarInfoList = operatorProperties.stateVariables
- .filter(stateVar => stateVar.stateName == stateVarName)
- require(stateVarInfoList.size == 1, s"Failed to find unique state variable info " +
- s"for state variable $stateVarName in operator ${sourceOptions.operatorId}")
- val stateVarInfo = stateVarInfoList.head
- transformWithStateVariableInfoOpt = Some(stateVarInfo)
- val schemaFilePaths = storeMetadataEntry.stateSchemaFilePaths
- val stateSchemaMetadata = StateSchemaMetadata.createStateSchemaMetadata(
- sourceOptions.stateCheckpointLocation.toString,
- hadoopConf,
- schemaFilePaths
- )
- stateSchemaProvider = Some(new InMemoryStateSchemaProvider(stateSchemaMetadata))
- schemaFilePaths.map(new Path(_))
} else {
- None
- }.toList
+ StateDataSource.getOldSchemaFilePaths(sourceOptions, hadoopConf)
+ }
try {
// Read the actual state schema from the provided path for v2 or from the dedicated path
@@ -276,7 +310,8 @@ class StateDataSource extends TableProvider with DataSourceRegister with Logging
keyStateEncoderSpecOpt,
stateStoreColFamilySchemaOpt,
transformWithStateVariableInfoOpt,
- stateSchemaProvider
+ stateSchemaProvider,
+ joinColFamilyOpt
)
}
@@ -335,7 +370,8 @@ case class StateSourceOptions(
readChangeFeedOptions: Option[ReadChangeFeedOptions],
stateVarName: Option[String],
readRegisteredTimers: Boolean,
- flattenCollectionTypes: Boolean) {
+ flattenCollectionTypes: Boolean,
+ operatorStateUniqueIds: Option[Array[Array[String]]] = None) {
def stateCheckpointLocation: Path = new Path(resolvedCpLocation, DIR_NAME_STATE)
override def toString: String = {
@@ -532,10 +568,37 @@ object StateSourceOptions extends DataSourceOptions {
}
}
+ val startBatchId = if (fromSnapshotOptions.isDefined) {
+ fromSnapshotOptions.get.snapshotStartBatchId
+ } else if (readChangeFeedOptions.isDefined) {
+ readChangeFeedOptions.get.changeStartBatchId
+ } else {
+ batchId.get
+ }
+
+ val operatorStateUniqueIds = getOperatorStateUniqueIds(
+ sparkSession,
+ startBatchId,
+ operatorId,
+ resolvedCpLocation)
+
+ if (operatorStateUniqueIds.isDefined) {
+ if (fromSnapshotOptions.isDefined) {
+ throw StateDataSourceErrors.invalidOptionValue(
+ SNAPSHOT_START_BATCH_ID,
+ "Snapshot reading is currently not supported with checkpoint v2.")
+ }
+ if (readChangeFeedOptions.isDefined) {
+ throw StateDataSourceErrors.invalidOptionValue(
+ READ_CHANGE_FEED,
+ "Read change feed is currently not supported with checkpoint v2.")
+ }
+ }
+
StateSourceOptions(
resolvedCpLocation, batchId.get, operatorId, storeName, joinSide,
readChangeFeed, fromSnapshotOptions, readChangeFeedOptions,
- stateVarName, readRegisteredTimers, flattenCollectionTypes)
+ stateVarName, readRegisteredTimers, flattenCollectionTypes, operatorStateUniqueIds)
}
private def resolvedCheckpointLocation(
@@ -553,6 +616,41 @@ object StateSourceOptions extends DataSourceOptions {
case None => throw StateDataSourceErrors.committedBatchUnavailable(checkpointLocation)
}
}
+
+ private def getOperatorStateUniqueIds(
+ session: SparkSession,
+ batchId: Long,
+ operatorId: Long,
+ checkpointLocation: String): Option[Array[Array[String]]] = {
+ val commitLog = new StreamingQueryCheckpointMetadata(session, checkpointLocation).commitLog
+ val commitMetadata = commitLog.get(batchId) match {
+ case Some(commitMetadata) => commitMetadata
+ case None => throw StateDataSourceErrors.committedBatchUnavailable(checkpointLocation)
+ }
+
+ commitMetadata.stateUniqueIds.flatMap(_.get(operatorId))
+ }
+
+ // Modifies the source options based on what is stored in the checkpoint and returns the result.
+ // If this is a join operator that specifies a store name and uses state format v3,
+ // the options need to be rewritten.
+ private[state] def modifySourceOptions(
+ hadoopConf: Configuration, sourceOptions: StateSourceOptions): StateSourceOptions = {
+ // If a storeName is specified (e.g. right-keyToNumValues) and v3 is used,
+ // the join uses virtual column families rather than separate stores. In that case,
+ // the options are modified to set stateVarName to that storeName and to reset
+ // storeName to the default.
+ if (sourceOptions.storeName != StateStoreId.DEFAULT_STORE_NAME &&
+ StreamStreamJoinStateHelper.usesVirtualColumnFamilies(
+ hadoopConf, sourceOptions.stateCheckpointLocation.toString,
+ sourceOptions.operatorId)) {
+ sourceOptions.copy(
+ stateVarName = Some(sourceOptions.storeName),
+ storeName = StateStoreId.DEFAULT_STORE_NAME)
+ } else {
+ sourceOptions
+ }
+ }
}
// Case class to store information around the key state encoder, col family schema and
@@ -561,5 +659,28 @@ case class StateStoreReaderInfo(
keyStateEncoderSpecOpt: Option[KeyStateEncoderSpec],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
transformWithStateVariableInfoOpt: Option[TransformWithStateVariableInfo],
- stateSchemaProviderOpt: Option[StateSchemaProvider]
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String] // Only used for join op with state format v3
)
+
+object StateDataSource {
+ private def getStateStoreMetadata(
+ stateSourceOptions: StateSourceOptions,
+ hadoopConf: Configuration): Array[StateMetadataTableEntry] = {
+ val allStateStoreMetadata = new StateMetadataPartitionReader(
+ stateSourceOptions.stateCheckpointLocation.getParent.toString,
+ new SerializableConfiguration(hadoopConf), stateSourceOptions.batchId).stateMetadata.toArray
+ val stateStoreMetadata = allStateStoreMetadata.filter { entry =>
+ entry.operatorId == stateSourceOptions.operatorId &&
+ entry.stateStoreName == stateSourceOptions.storeName
+ }
+ stateStoreMetadata
+ }
+
+ def getOldSchemaFilePaths(
+ stateSourceOptions: StateSourceOptions,
+ hadoopConf: Configuration): List[Path] = {
+ val metadata = getStateStoreMetadata(stateSourceOptions, hadoopConf)
+ metadata.headOption.map(_.stateSchemaFilePaths.map(new Path(_))).getOrElse(List.empty)
+ }
+}
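
As a usage sketch for the reader-side changes above (the checkpoint path is a placeholder), a stream-stream join's state can still be queried by store name when the checkpoint was written with state format v3, because `modifySourceOptions` remaps the store name onto a virtual column family:

```scala
// Hedged usage sketch for the "statestore" reader; the path is a placeholder.
import org.apache.spark.sql.SparkSession

val spark = SparkSession.builder().appName("state-reader-sketch").getOrCreate()

val joinState = spark.read
  .format("statestore")
  .option("path", "/tmp/checkpoints/my-join-query")  // placeholder checkpoint root
  .option("operatorId", "0")
  .option("storeName", "right-keyToNumValues")       // remapped to a column family on format v3
  .load()

joinState.printSchema()
```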
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StatePartitionReader.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StatePartitionReader.scala
index 4aa95ad42ec7f..ebef6e3dac552 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StatePartitionReader.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StatePartitionReader.scala
@@ -21,7 +21,8 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UnsafeRow}
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
import org.apache.spark.sql.execution.datasources.v2.state.utils.SchemaUtil
-import org.apache.spark.sql.execution.streaming.{StateVariableType, TransformWithStateVariableInfo}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.SymmetricHashJoinStateManager
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.{StateVariableType, TransformWithStateVariableInfo}
import org.apache.spark.sql.execution.streaming.state._
import org.apache.spark.sql.execution.streaming.state.RecordType.{getRecordTypeAsString, RecordType}
import org.apache.spark.sql.types.{NullType, StructField, StructType}
@@ -42,7 +43,8 @@ class StatePartitionReaderFactory(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider])
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String])
extends PartitionReaderFactory {
override def createReader(partition: InputPartition): PartitionReader[InternalRow] = {
@@ -50,11 +52,11 @@ class StatePartitionReaderFactory(
if (stateStoreInputPartition.sourceOptions.readChangeFeed) {
new StateStoreChangeDataPartitionReader(storeConf, hadoopConf,
stateStoreInputPartition, schema, keyStateEncoderSpec, stateVariableInfoOpt,
- stateStoreColFamilySchemaOpt, stateSchemaProviderOpt)
+ stateStoreColFamilySchemaOpt, stateSchemaProviderOpt, joinColFamilyOpt)
} else {
new StatePartitionReader(storeConf, hadoopConf,
stateStoreInputPartition, schema, keyStateEncoderSpec, stateVariableInfoOpt,
- stateStoreColFamilySchemaOpt, stateSchemaProviderOpt)
+ stateStoreColFamilySchemaOpt, stateSchemaProviderOpt, joinColFamilyOpt)
}
}
}
@@ -71,7 +73,8 @@ abstract class StatePartitionReaderBase(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider])
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String])
extends PartitionReader[InternalRow] with Logging {
// Used primarily as a placeholder for the value schema in the context of
// state variables used within the transformWithState operator.
@@ -93,16 +96,19 @@ abstract class StatePartitionReaderBase(
schema, "value").asInstanceOf[StructType]
}
+ protected val getStoreUniqueId: Option[String] = {
+ SymmetricHashJoinStateManager.getStateStoreCheckpointId(
+ storeName = partition.sourceOptions.storeName,
+ partitionId = partition.partition,
+ stateStoreCkptIds = partition.sourceOptions.operatorStateUniqueIds)
+ }
+
protected lazy val provider: StateStoreProvider = {
val stateStoreId = StateStoreId(partition.sourceOptions.stateCheckpointLocation.toString,
partition.sourceOptions.operatorId, partition.partition, partition.sourceOptions.storeName)
val stateStoreProviderId = StateStoreProviderId(stateStoreId, partition.queryId)
- val useColFamilies = if (stateVariableInfoOpt.isDefined) {
- true
- } else {
- false
- }
+ val useColFamilies = stateVariableInfoOpt.isDefined || joinColFamilyOpt.isDefined
val useMultipleValuesPerKey = SchemaUtil.checkVariableType(stateVariableInfoOpt,
StateVariableType.ListState)
@@ -115,7 +121,9 @@ abstract class StatePartitionReaderBase(
val isInternal = partition.sourceOptions.readRegisteredTimers
if (useColFamilies) {
- val store = provider.getStore(partition.sourceOptions.batchId + 1)
+ val store = provider.getStore(
+ partition.sourceOptions.batchId + 1,
+ getStoreUniqueId)
require(stateStoreColFamilySchemaOpt.isDefined)
val stateStoreColFamilySchema = stateStoreColFamilySchemaOpt.get
require(stateStoreColFamilySchema.keyStateEncoderSpec.isDefined)
@@ -126,6 +134,7 @@ abstract class StatePartitionReaderBase(
stateStoreColFamilySchema.keyStateEncoderSpec.get,
useMultipleValuesPerKey = useMultipleValuesPerKey,
isInternal = isInternal)
+ store.abort()
}
provider
}
@@ -164,14 +173,19 @@ class StatePartitionReader(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider])
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String])
extends StatePartitionReaderBase(storeConf, hadoopConf, partition, schema,
keyStateEncoderSpec, stateVariableInfoOpt, stateStoreColFamilySchemaOpt,
- stateSchemaProviderOpt) {
+ stateSchemaProviderOpt, joinColFamilyOpt) {
private lazy val store: ReadStateStore = {
partition.sourceOptions.fromSnapshotOptions match {
- case None => provider.getReadStore(partition.sourceOptions.batchId + 1)
+ case None =>
+ provider.getReadStore(
+ partition.sourceOptions.batchId + 1,
+ getStoreUniqueId
+ )
case Some(fromSnapshotOptions) =>
if (!provider.isInstanceOf[SupportsFineGrainedReplay]) {
@@ -186,17 +200,18 @@ class StatePartitionReader(
}
override lazy val iter: Iterator[InternalRow] = {
- val stateVarName = stateVariableInfoOpt
- .map(_.stateName).getOrElse(StateStore.DEFAULT_COL_FAMILY_NAME)
+ val colFamilyName = stateStoreColFamilySchemaOpt
+ .map(_.colFamilyName).getOrElse(
+ joinColFamilyOpt.getOrElse(StateStore.DEFAULT_COL_FAMILY_NAME))
if (stateVariableInfoOpt.isDefined) {
val stateVariableInfo = stateVariableInfoOpt.get
val stateVarType = stateVariableInfo.stateVariableType
- SchemaUtil.processStateEntries(stateVarType, stateVarName, store,
+ SchemaUtil.processStateEntries(stateVarType, colFamilyName, store,
keySchema, partition.partition, partition.sourceOptions)
} else {
store
- .iterator(stateVarName)
+ .iterator(colFamilyName)
.map { pair =>
SchemaUtil.unifyStateRowPair((pair.key, pair.value), partition.partition)
}
@@ -204,7 +219,7 @@ class StatePartitionReader(
}
override def close(): Unit = {
- store.abort()
+ store.release()
super.close()
}
}
@@ -221,10 +236,11 @@ class StateStoreChangeDataPartitionReader(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider])
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String])
extends StatePartitionReaderBase(storeConf, hadoopConf, partition, schema,
keyStateEncoderSpec, stateVariableInfoOpt, stateStoreColFamilySchemaOpt,
- stateSchemaProviderOpt) {
+ stateSchemaProviderOpt, joinColFamilyOpt) {
private lazy val changeDataReader:
NextIterator[(RecordType.Value, UnsafeRow, UnsafeRow, Long)] = {
@@ -235,6 +251,8 @@ class StateStoreChangeDataPartitionReader(
val colFamilyNameOpt = if (stateVariableInfoOpt.isDefined) {
Some(stateVariableInfoOpt.get.stateName)
+ } else if (joinColFamilyOpt.isDefined) {
+ Some(joinColFamilyOpt.get)
} else {
None
}
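
The column-family choice made by the two readers above reduces to a simple fallback chain; the helper below is only an illustration of that order, not part of the patch:

```scala
// Prefer the transformWithState variable name, then the join column family,
// otherwise fall back to the store's default column family.
def resolveColFamily(
    stateVarName: Option[String],
    joinColFamily: Option[String],
    defaultName: String = "default"): String =
  stateVarName.orElse(joinColFamily).getOrElse(defaultName)
```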
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateScanBuilder.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateScanBuilder.scala
index 3b8dad7a18090..a1bd88f40740a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateScanBuilder.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateScanBuilder.scala
@@ -25,8 +25,8 @@ import org.apache.hadoop.fs.{Path, PathFilter}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.connector.read.{Batch, InputPartition, PartitionReaderFactory, Scan, ScanBuilder}
import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.JoinSideValues
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper.{LeftSide, RightSide}
-import org.apache.spark.sql.execution.streaming.TransformWithStateVariableInfo
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper.{LeftSide, RightSide}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateVariableInfo
import org.apache.spark.sql.execution.streaming.state.{KeyStateEncoderSpec, StateSchemaProvider, StateStoreColFamilySchema, StateStoreConf, StateStoreErrors}
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.SerializableConfiguration
@@ -45,9 +45,11 @@ class StateScanBuilder(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider]) extends ScanBuilder {
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String]) extends ScanBuilder {
override def build(): Scan = new StateScan(session, schema, sourceOptions, stateStoreConf,
- keyStateEncoderSpec, stateVariableInfoOpt, stateStoreColFamilySchemaOpt, stateSchemaProviderOpt)
+ keyStateEncoderSpec, stateVariableInfoOpt, stateStoreColFamilySchemaOpt, stateSchemaProviderOpt,
+ joinColFamilyOpt)
}
/** An implementation of [[InputPartition]] for State Store data source. */
@@ -65,7 +67,8 @@ class StateScan(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider])
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String])
extends Scan with Batch {
// A Hadoop Configuration can be about 10 KB, which is pretty big, so broadcast it
@@ -120,24 +123,28 @@ class StateScan(
override def createReaderFactory(): PartitionReaderFactory = sourceOptions.joinSide match {
case JoinSideValues.left =>
val userFacingSchema = schema
+ val oldSchemaFilePaths = StateDataSource.getOldSchemaFilePaths(sourceOptions,
+ hadoopConfBroadcast.value.value)
val stateSchema = StreamStreamJoinStateHelper.readSchema(session,
sourceOptions.stateCheckpointLocation.toString, sourceOptions.operatorId, LeftSide,
- excludeAuxColumns = false)
+ oldSchemaFilePaths, excludeAuxColumns = false)
new StreamStreamJoinStatePartitionReaderFactory(stateStoreConf,
hadoopConfBroadcast.value, userFacingSchema, stateSchema)
case JoinSideValues.right =>
val userFacingSchema = schema
+ val oldSchemaFilePaths = StateDataSource.getOldSchemaFilePaths(sourceOptions,
+ hadoopConfBroadcast.value.value)
val stateSchema = StreamStreamJoinStateHelper.readSchema(session,
sourceOptions.stateCheckpointLocation.toString, sourceOptions.operatorId, RightSide,
- excludeAuxColumns = false)
+ oldSchemaFilePaths, excludeAuxColumns = false)
new StreamStreamJoinStatePartitionReaderFactory(stateStoreConf,
hadoopConfBroadcast.value, userFacingSchema, stateSchema)
case JoinSideValues.none =>
new StatePartitionReaderFactory(stateStoreConf, hadoopConfBroadcast.value, schema,
keyStateEncoderSpec, stateVariableInfoOpt, stateStoreColFamilySchemaOpt,
- stateSchemaProviderOpt)
+ stateSchemaProviderOpt, joinColFamilyOpt)
}
override def toBatch: Batch = this
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateTable.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateTable.scala
index 71b18be7fdf58..dfa378e8a5972 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateTable.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StateTable.scala
@@ -25,7 +25,7 @@ import org.apache.spark.sql.connector.catalog.{MetadataColumn, SupportsMetadataC
import org.apache.spark.sql.connector.read.ScanBuilder
import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.JoinSideValues
import org.apache.spark.sql.execution.datasources.v2.state.utils.SchemaUtil
-import org.apache.spark.sql.execution.streaming.TransformWithStateVariableInfo
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateVariableInfo
import org.apache.spark.sql.execution.streaming.state.{KeyStateEncoderSpec, StateSchemaProvider, StateStoreColFamilySchema, StateStoreConf}
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.util.CaseInsensitiveStringMap
@@ -44,7 +44,8 @@ class StateTable(
keyStateEncoderSpec: KeyStateEncoderSpec,
stateVariableInfoOpt: Option[TransformWithStateVariableInfo],
stateStoreColFamilySchemaOpt: Option[StateStoreColFamilySchema],
- stateSchemaProviderOpt: Option[StateSchemaProvider])
+ stateSchemaProviderOpt: Option[StateSchemaProvider],
+ joinColFamilyOpt: Option[String])
extends Table with SupportsRead with SupportsMetadataColumns {
import StateTable._
@@ -85,7 +86,8 @@ class StateTable(
override def newScanBuilder(options: CaseInsensitiveStringMap): ScanBuilder =
new StateScanBuilder(session, schema, sourceOptions, stateConf, keyStateEncoderSpec,
- stateVariableInfoOpt, stateStoreColFamilySchemaOpt, stateSchemaProviderOpt)
+ stateVariableInfoOpt, stateStoreColFamilySchemaOpt, stateSchemaProviderOpt,
+ joinColFamilyOpt)
override def properties(): util.Map[String, String] = Map.empty[String, String].asJava
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStateHelper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStateHelper.scala
index 1a04d24f0048d..5cb38022159cb 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStateHelper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStateHelper.scala
@@ -18,9 +18,14 @@ package org.apache.spark.sql.execution.datasources.v2.state
import java.util.UUID
+import org.apache.hadoop.conf.Configuration
+import org.apache.hadoop.fs.Path
+
import org.apache.spark.sql.SparkSession
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper.JoinSide
-import org.apache.spark.sql.execution.streaming.state.{StateSchemaCompatibilityChecker, StateStore, StateStoreId, StateStoreProviderId, SymmetricHashJoinStateManager}
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper.{JoinSide, LeftSide}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.SymmetricHashJoinStateManager
+import org.apache.spark.sql.execution.streaming.state.{StateSchemaCompatibilityChecker, StateStore, StateStoreId, StateStoreProviderId}
import org.apache.spark.sql.types.{BooleanType, StructType}
/**
@@ -35,52 +40,92 @@ object StreamStreamJoinStateHelper {
stateCheckpointLocation: String,
operatorId: Int,
side: JoinSide,
+ oldSchemaFilePaths: List[Path],
excludeAuxColumns: Boolean = true): StructType = {
val (keySchema, valueSchema) = readKeyValueSchema(session, stateCheckpointLocation,
- operatorId, side, excludeAuxColumns)
+ operatorId, side, oldSchemaFilePaths, excludeAuxColumns)
new StructType()
.add("key", keySchema)
.add("value", valueSchema)
}
+ // Returns whether the checkpoint uses stateFormatVersion 3, which uses virtual column
+ // families for the join.
+ def usesVirtualColumnFamilies(
+ hadoopConf: Configuration,
+ stateCheckpointLocation: String,
+ operatorId: Int): Boolean = {
+ // If the schema exists for operatorId/partitionId/left-keyToNumValues, it is not
+ // stateFormatVersion 3.
+ val partitionId = StateStore.PARTITION_ID_TO_CHECK_SCHEMA
+ val storeId = new StateStoreId(stateCheckpointLocation, operatorId,
+ partitionId, SymmetricHashJoinStateManager.allStateStoreNames(LeftSide).toList.head)
+ val schemaFilePath = StateSchemaCompatibilityChecker.schemaFile(
+ storeId.storeCheckpointLocation())
+ val fm = CheckpointFileManager.create(schemaFilePath, hadoopConf)
+ !fm.exists(schemaFilePath)
+ }
+
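
The probe above boils down to a file-existence check; a simplified standalone version is sketched below (the schema-file layout in the path is an assumption for illustration, not the exact location Spark computes via `StateSchemaCompatibilityChecker`):

```scala
// Hedged sketch: if the old per-store schema file for left-keyToNumValues is
// missing, the join state lives in one default store with virtual column
// families (state format v3). The path layout shown here is assumed.
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.Path

def probablyUsesVirtualColumnFamilies(
    hadoopConf: Configuration,
    stateCheckpointLocation: String,
    operatorId: Long): Boolean = {
  val legacySchemaFile = new Path(
    s"$stateCheckpointLocation/$operatorId/0/left-keyToNumValues/_metadata/schema")
  val fs = legacySchemaFile.getFileSystem(hadoopConf)
  !fs.exists(legacySchemaFile)
}
```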
def readKeyValueSchema(
session: SparkSession,
stateCheckpointLocation: String,
operatorId: Int,
side: JoinSide,
+ oldSchemaFilePaths: List[Path],
excludeAuxColumns: Boolean = true): (StructType, StructType) = {
+ val newHadoopConf = session.sessionState.newHadoopConf()
+ val partitionId = StateStore.PARTITION_ID_TO_CHECK_SCHEMA
// KeyToNumValuesType, KeyWithIndexToValueType
val storeNames = SymmetricHashJoinStateManager.allStateStoreNames(side).toList
- val partitionId = StateStore.PARTITION_ID_TO_CHECK_SCHEMA
- val storeIdForKeyToNumValues = new StateStoreId(stateCheckpointLocation, operatorId,
- partitionId, storeNames(0))
- val providerIdForKeyToNumValues = new StateStoreProviderId(storeIdForKeyToNumValues,
- UUID.randomUUID())
+ val (keySchema, valueSchema) =
+ if (!usesVirtualColumnFamilies(
+ newHadoopConf, stateCheckpointLocation, operatorId)) {
+ val storeIdForKeyToNumValues = new StateStoreId(stateCheckpointLocation, operatorId,
+ partitionId, storeNames(0))
+ val providerIdForKeyToNumValues = new StateStoreProviderId(storeIdForKeyToNumValues,
+ UUID.randomUUID())
- val storeIdForKeyWithIndexToValue = new StateStoreId(stateCheckpointLocation,
- operatorId, partitionId, storeNames(1))
- val providerIdForKeyWithIndexToValue = new StateStoreProviderId(storeIdForKeyWithIndexToValue,
- UUID.randomUUID())
+ val storeIdForKeyWithIndexToValue = new StateStoreId(stateCheckpointLocation,
+ operatorId, partitionId, storeNames(1))
+ val providerIdForKeyWithIndexToValue = new StateStoreProviderId(
+ storeIdForKeyWithIndexToValue, UUID.randomUUID())
- val newHadoopConf = session.sessionState.newHadoopConf()
+ // read the key schema from the keyToNumValues store for the join keys
+ val manager = new StateSchemaCompatibilityChecker(
+ providerIdForKeyToNumValues, newHadoopConf, oldSchemaFilePaths)
+ val kSchema = manager.readSchemaFile().head.keySchema
+
+ // read the value schema from the keyWithIndexToValue store for the values
+ val manager2 = new StateSchemaCompatibilityChecker(providerIdForKeyWithIndexToValue,
+ newHadoopConf, oldSchemaFilePaths)
+ val vSchema = manager2.readSchemaFile().head.valueSchema
+
+ (kSchema, vSchema)
+ } else {
+ val storeId = new StateStoreId(stateCheckpointLocation, operatorId,
+ partitionId, StateStoreId.DEFAULT_STORE_NAME)
+ val providerId = new StateStoreProviderId(storeId, UUID.randomUUID())
+
+ val manager = new StateSchemaCompatibilityChecker(
+ providerId, newHadoopConf, oldSchemaFilePaths)
+ val kSchema = manager.readSchemaFile().find { schema =>
+ schema.colFamilyName == storeNames(0)
+ }.map(_.keySchema).get
- // read the key schema from the keyToNumValues store for the join keys
- val manager = new StateSchemaCompatibilityChecker(providerIdForKeyToNumValues, newHadoopConf)
- val keySchema = manager.readSchemaFile().head.keySchema
+ val vSchema = manager.readSchemaFile().find { schema =>
+ schema.colFamilyName == storeNames(1)
+ }.map(_.valueSchema).get
- // read the value schema from the keyWithIndexToValue store for the values
- val manager2 = new StateSchemaCompatibilityChecker(providerIdForKeyWithIndexToValue,
- newHadoopConf)
- val valueSchema = manager2.readSchemaFile().head.valueSchema
+ (kSchema, vSchema)
+ }
val maybeMatchedColumn = valueSchema.last
if (excludeAuxColumns
- && maybeMatchedColumn.name == "matched"
- && maybeMatchedColumn.dataType == BooleanType) {
+ && maybeMatchedColumn.name == "matched"
+ && maybeMatchedColumn.dataType == BooleanType) {
// remove internal column `matched` for format version 2
(keySchema, StructType(valueSchema.dropRight(1)))
} else {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStatePartitionReader.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStatePartitionReader.scala
index e1d61de77380f..0f8a3b3b609f8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStatePartitionReader.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/StreamStreamJoinStatePartitionReader.scala
@@ -23,9 +23,10 @@ import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.JoinSideValues
import org.apache.spark.sql.execution.datasources.v2.state.utils.SchemaUtil
-import org.apache.spark.sql.execution.streaming.StatefulOperatorStateInfo
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper.{JoinSide, LeftSide, RightSide}
-import org.apache.spark.sql.execution.streaming.state.{JoinStateManagerStoreGenerator, StateStoreConf, SymmetricHashJoinStateManager}
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorStateInfo
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.{JoinStateManagerStoreGenerator, SymmetricHashJoinStateManager}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper.{JoinSide, LeftSide, RightSide}
+import org.apache.spark.sql.execution.streaming.state.StateStoreConf
import org.apache.spark.sql.types.{BooleanType, StructType}
import org.apache.spark.util.SerializableConfiguration
@@ -70,6 +71,28 @@ class StreamStreamJoinStatePartitionReader(
throw StateDataSourceErrors.internalError("Unexpected join side for stream-stream read!")
}
+ private val usesVirtualColumnFamilies = StreamStreamJoinStateHelper.usesVirtualColumnFamilies(
+ hadoopConf.value,
+ partition.sourceOptions.stateCheckpointLocation.toString,
+ partition.sourceOptions.operatorId)
+
+ private val stateStoreCheckpointIds = SymmetricHashJoinStateManager.getStateStoreCheckpointIds(
+ partition.partition,
+ partition.sourceOptions.operatorStateUniqueIds,
+ usesVirtualColumnFamilies)
+
+ private val keyToNumValuesStateStoreCkptId = if (joinSide == LeftSide) {
+ stateStoreCheckpointIds.left.keyToNumValues
+ } else {
+ stateStoreCheckpointIds.right.keyToNumValues
+ }
+
+ private val keyWithIndexToValueStateStoreCkptId = if (joinSide == LeftSide) {
+ stateStoreCheckpointIds.left.keyWithIndexToValue
+ } else {
+ stateStoreCheckpointIds.right.keyWithIndexToValue
+ }
+
/*
* This is to handle the difference of schema across state format versions. The major difference
* is whether we have added new field(s) in addition to the fields from input schema.
@@ -80,8 +103,15 @@ class StreamStreamJoinStatePartitionReader(
private val (inputAttributes, formatVersion) = {
val maybeMatchedColumn = valueSchema.last
val (fields, version) = {
+ // If there is a matched column, version is either 2 or 3. We need to drop the matched
+ // column from the value schema to get the actual fields.
if (maybeMatchedColumn.name == "matched" && maybeMatchedColumn.dataType == BooleanType) {
- (valueSchema.dropRight(1), 2)
+ // If the checkpoint uses a single store with virtual column families, the version is 3
+ if (usesVirtualColumnFamilies) {
+ (valueSchema.dropRight(1), 3)
+ } else {
+ (valueSchema.dropRight(1), 2)
+ }
} else {
(valueSchema, 1)
}
@@ -119,8 +149,8 @@ class StreamStreamJoinStatePartitionReader(
storeConf = storeConf,
hadoopConf = hadoopConf.value,
partitionId = partition.partition,
- keyToNumValuesStateStoreCkptId = None,
- keyWithIndexToValueStateStoreCkptId = None,
+ keyToNumValuesStateStoreCkptId = keyToNumValuesStateStoreCkptId,
+ keyWithIndexToValueStateStoreCkptId = keyWithIndexToValueStateStoreCkptId,
formatVersion,
skippedNullValueCount = None,
useStateStoreCoordinator = false,
@@ -137,7 +167,7 @@ class StreamStreamJoinStatePartitionReader(
inputAttributes)
joinStateManager.iterator.map { pair =>
- if (formatVersion == 2) {
+ if (formatVersion >= 2) {
val row = valueWithMatchedRowGenerator(pair.value)
row.setBoolean(indexOrdinalInValueWithMatchedRow, pair.matched)
unifyStateRowPair(pair.key, row)
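
The version detection described in the comments above amounts to a small decision function (illustrative only):

```scala
// A trailing boolean "matched" column means join state format 2 or 3; format 3
// is the variant that keeps all join stores as virtual column families in a
// single state store, and is handled by the same code path as format 2 above.
def joinStateFormatVersion(
    hasMatchedColumn: Boolean,
    usesVirtualColumnFamilies: Boolean): Int =
  if (!hasMatchedColumn) 1
  else if (usesVirtualColumnFamilies) 3
  else 2
```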
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/metadata/StateMetadataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/metadata/StateMetadataSource.scala
index c5ccff9228d6e..31e6ac30a5984 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/metadata/StateMetadataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/metadata/StateMetadataSource.scala
@@ -23,7 +23,7 @@ import scala.jdk.CollectionConverters._
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{Path, PathFilter}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.GenericInternalRow
@@ -32,7 +32,7 @@ import org.apache.spark.sql.connector.expressions.Transform
import org.apache.spark.sql.connector.read.{Batch, InputPartition, PartitionReader, PartitionReaderFactory, Scan, ScanBuilder}
import org.apache.spark.sql.execution.datasources.v2.state.StateDataSourceErrors
import org.apache.spark.sql.execution.datasources.v2.state.StateSourceOptions.PATH
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
import org.apache.spark.sql.execution.streaming.state.{OperatorStateMetadata, OperatorStateMetadataReader, OperatorStateMetadataUtils, OperatorStateMetadataV1, OperatorStateMetadataV2}
import org.apache.spark.sql.sources.DataSourceRegister
import org.apache.spark.sql.types.{DataType, IntegerType, LongType, StringType, StructType}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/utils/SchemaUtil.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/utils/SchemaUtil.scala
index 84eab3356c204..52df016791d48 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/utils/SchemaUtil.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/v2/state/utils/SchemaUtil.scala
@@ -25,8 +25,8 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UnsafeRow}
import org.apache.spark.sql.catalyst.util.{ArrayBasedMapData, GenericArrayData}
import org.apache.spark.sql.execution.datasources.v2.state.{StateDataSourceErrors, StateSourceOptions}
-import org.apache.spark.sql.execution.streaming.{StateVariableType, TransformWithStateVariableInfo}
-import org.apache.spark.sql.execution.streaming.StateVariableType._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.{StateVariableType, TransformWithStateVariableInfo}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateVariableType._
import org.apache.spark.sql.execution.streaming.state.{ReadStateStore, StateStoreColFamilySchema, UnsafeRowPair}
import org.apache.spark.sql.types.{ArrayType, DataType, IntegerType, LongType, MapType, StringType, StructType}
import org.apache.spark.util.ArrayImplicits._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlDataSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlDataSource.scala
index 23bca35725397..9dbca57e2ae95 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlDataSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlDataSource.scala
@@ -22,7 +22,6 @@ import java.nio.charset.{Charset, StandardCharsets}
import scala.util.control.NonFatal
-import org.apache.commons.lang3.exception.ExceptionUtils
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileStatus, Path}
import org.apache.hadoop.hdfs.BlockMissingException
@@ -37,7 +36,7 @@ import org.apache.spark.rdd.{BinaryFileRDD, RDD}
import org.apache.spark.sql.{Dataset, Encoders, SparkSession}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.util.FailureSafeParser
-import org.apache.spark.sql.catalyst.xml.{StaxXmlParser, XmlInferSchema, XmlOptions}
+import org.apache.spark.sql.catalyst.xml.{StaxXmlParser, StaxXMLRecordReader, XmlInferSchema, XmlOptions}
import org.apache.spark.sql.classic.ClassicConversions.castToImpl
import org.apache.spark.sql.execution.SQLExecution
import org.apache.spark.sql.execution.datasources._
@@ -175,15 +174,26 @@ object MultiLineXmlDataSource extends XmlDataSource {
file: PartitionedFile,
parser: StaxXmlParser,
requiredSchema: StructType): Iterator[InternalRow] = {
- parser.parseStream(
- CodecStreams.createInputStreamWithCloseResource(conf, file.toPath),
- requiredSchema)
+ if (parser.options.useLegacyXMLParser) {
+ parser.parseStream(
+ CodecStreams.createInputStreamWithCloseResource(conf, file.toPath),
+ requiredSchema)
+ } else {
+ parser.parseStreamOptimized(
+ () => CodecStreams.createInputStreamWithCloseResource(conf, file.toPath),
+ requiredSchema)
+ }
}
override def infer(
sparkSession: SparkSession,
inputPaths: Seq[FileStatus],
parsedOptions: XmlOptions): StructType = {
+
+ if (!parsedOptions.useLegacyXMLParser) {
+ return inferOptimized(sparkSession, inputPaths, parsedOptions)
+ }
+
val xml = createBaseRdd(sparkSession, inputPaths, parsedOptions)
val tokenRDD: RDD[String] =
@@ -199,7 +209,7 @@ object MultiLineXmlDataSource extends XmlDataSource {
logWarning("Skipped missing file", e)
Iterator.empty[String]
case NonFatal(e) =>
- ExceptionUtils.getRootCause(e) match {
+ Utils.getRootCause(e) match {
case e @ (_ : AccessControlException | _ : BlockMissingException) => throw e
case _: RuntimeException | _: IOException if parsedOptions.ignoreCorruptFiles =>
logWarning("Skipped the rest of the content in the corrupted file", e)
@@ -216,6 +226,31 @@ object MultiLineXmlDataSource extends XmlDataSource {
}
}
+ private def inferOptimized(
+ sparkSession: SparkSession,
+ inputPaths: Seq[FileStatus],
+ parsedOptions: XmlOptions): StructType = {
+
+ val xml = createBaseRdd(sparkSession, inputPaths, parsedOptions)
+
+ val xmlParserRdd: RDD[StaxXMLRecordReader] =
+ xml.flatMap { portableDataStream =>
+ val inputStream = () =>
+ CodecStreams.createInputStreamWithCloseResource(
+ portableDataStream.getConfiguration,
+ new Path(portableDataStream.getPath())
+ )
+ StaxXmlParser.convertStream(inputStream, parsedOptions)(identity)
+ }
+
+ SQLExecution.withSQLConfPropagated(sparkSession) {
+ val schema =
+ new XmlInferSchema(parsedOptions, sparkSession.sessionState.conf.caseSensitiveAnalysis)
+ .inferFromReaders(xmlParserRdd)
+ schema
+ }
+ }
+
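
From the user's side, the optimized path is exercised by an ordinary multi-line XML read; the sketch below assumes an active `SparkSession` named `spark`, the row tag and path are placeholders, and the name of the legacy-parser switch is an assumption (it may be exposed as a SQL conf rather than a per-read option):

```scala
// Hedged usage sketch for the XML reader changes above.
val records = spark.read
  .format("xml")
  .option("rowTag", "record")               // placeholder row tag
  // .option("useLegacyXMLParser", "true")  // assumed name of the legacy-parser toggle
  .load("/data/records.xml")                // placeholder path

records.printSchema()
```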
private def createBaseRdd(
sparkSession: SparkSession,
inputPaths: Seq[FileStatus],
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlFileFormat.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlFileFormat.scala
index 5072a87af4df7..06151c5fa4d64 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlFileFormat.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/datasources/xml/XmlFileFormat.scala
@@ -39,13 +39,11 @@ case class XmlFileFormat() extends TextBasedFileFormat with DataSourceRegister {
override def shortName(): String = "xml"
- def getXmlOptions(
+ private def getXmlOptions(
sparkSession: SparkSession,
parameters: Map[String, String]): XmlOptions = {
- new XmlOptions(parameters,
- sparkSession.sessionState.conf.sessionLocalTimeZone,
- sparkSession.sessionState.conf.columnNameOfCorruptRecord,
- true)
+ val conf = getSqlConf(sparkSession)
+ new XmlOptions(parameters, conf.sessionLocalTimeZone, conf.columnNameOfCorruptRecord, true)
}
override def isSplitable(
@@ -53,8 +51,7 @@ case class XmlFileFormat() extends TextBasedFileFormat with DataSourceRegister {
options: Map[String, String],
path: Path): Boolean = {
val xmlOptions = getXmlOptions(sparkSession, options)
- val xmlDataSource = XmlDataSource(xmlOptions)
- xmlDataSource.isSplitable && super.isSplitable(sparkSession, options, path)
+ XmlDataSource(xmlOptions).isSplitable && super.isSplitable(sparkSession, options, path)
}
override def inferSchema(
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/debug/package.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/debug/package.scala
index 0b97c8ebab815..b408f2823e16a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/debug/package.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/debug/package.scala
@@ -33,7 +33,7 @@ import org.apache.spark.sql.catalyst.plans.physical.Partitioning
import org.apache.spark.sql.catalyst.trees.TreeNodeRef
import org.apache.spark.sql.catalyst.util.StringConcat
import org.apache.spark.sql.execution.adaptive.{AdaptiveSparkPlanExec, QueryStageExec}
-import org.apache.spark.sql.execution.streaming.{StreamExecution, StreamingQueryWrapper}
+import org.apache.spark.sql.execution.streaming.runtime.{StreamExecution, StreamingQueryWrapper}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming.StreamingQuery
import org.apache.spark.sql.vectorized.ColumnarBatch
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/dynamicpruning/PlanDynamicPruningFilters.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/dynamicpruning/PlanDynamicPruningFilters.scala
index 059729d86bfaf..fbd341b6e7b87 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/dynamicpruning/PlanDynamicPruningFilters.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/dynamicpruning/PlanDynamicPruningFilters.scala
@@ -17,15 +17,14 @@
package org.apache.spark.sql.execution.dynamicpruning
-import org.apache.spark.sql.catalyst.expressions
-import org.apache.spark.sql.catalyst.expressions.{Alias, AttributeSeq, BindReferences, DynamicPruningExpression, DynamicPruningSubquery, Expression, ListQuery, Literal}
+import org.apache.spark.sql.catalyst.expressions.{Alias, AttributeSeq, BindReferences, DynamicPruningExpression, DynamicPruningSubquery, Expression, Literal}
import org.apache.spark.sql.catalyst.optimizer.{BuildLeft, BuildRight}
import org.apache.spark.sql.catalyst.plans.logical.Aggregate
import org.apache.spark.sql.catalyst.plans.physical.BroadcastMode
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.trees.TreePattern.DYNAMIC_PRUNING_SUBQUERY
import org.apache.spark.sql.classic.SparkSession
-import org.apache.spark.sql.execution.{InSubqueryExec, QueryExecution, SparkPlan, SubqueryBroadcastExec}
+import org.apache.spark.sql.execution.{InSubqueryExec, QueryExecution, SparkPlan, SubqueryBroadcastExec, SubqueryExec}
import org.apache.spark.sql.execution.exchange.BroadcastExchangeExec
import org.apache.spark.sql.execution.joins._
import org.apache.spark.sql.internal.SQLConf
@@ -56,6 +55,7 @@ case class PlanDynamicPruningFilters(sparkSession: SparkSession) extends Rule[Sp
case DynamicPruningSubquery(
value, buildPlan, buildKeys, broadcastKeyIndices, onlyInBroadcast, exprId, _) =>
val sparkPlan = QueryExecution.createSparkPlan(sparkSession.sessionState.planner, buildPlan)
+ val name = s"dynamicpruning#${exprId.id}"
// Using `sparkPlan` is a little hacky as it is based on the assumption that this rule is
// the first to be applied (apart from `InsertAdaptiveSparkPlan`).
val canReuseExchange = conf.exchangeReuseEnabled && buildKeys.nonEmpty &&
@@ -72,7 +72,6 @@ case class PlanDynamicPruningFilters(sparkSession: SparkSession) extends Rule[Sp
val mode = broadcastMode(buildKeys, executedPlan.output)
// plan a broadcast exchange of the build side of the join
val exchange = BroadcastExchangeExec(mode, executedPlan)
- val name = s"dynamicpruning#${exprId.id}"
// place the broadcast adaptor for reusing the broadcast results on the probe side
val broadcastValues =
SubqueryBroadcastExec(name, broadcastKeyIndices, buildKeys, exchange)
@@ -85,8 +84,9 @@ case class PlanDynamicPruningFilters(sparkSession: SparkSession) extends Rule[Sp
val aliases = broadcastKeyIndices.map(idx =>
Alias(buildKeys(idx), buildKeys(idx).toString)())
val aggregate = Aggregate(aliases, aliases, buildPlan)
- DynamicPruningExpression(expressions.InSubquery(
- Seq(value), ListQuery(aggregate, numCols = aggregate.output.length)))
+ val sparkPlan = QueryExecution.prepareExecutedPlan(sparkSession, aggregate)
+ val values = SubqueryExec(name, sparkPlan)
+ DynamicPruningExpression(InSubqueryExec(value, values, exprId))
}
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/BroadcastExchangeExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/BroadcastExchangeExec.scala
index c70ee637a2489..8c695f4f3958d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/BroadcastExchangeExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/BroadcastExchangeExec.scala
@@ -26,7 +26,6 @@ import scala.util.control.NonFatal
import org.apache.spark.{broadcast, SparkException}
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.rdd.{RDD, RDDOperationScope}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
@@ -145,6 +144,12 @@ case class BroadcastExchangeExec(
Statistics(dataSize, Some(rowCount))
}
+ override def resetMetrics(): Unit = {
+ // no-op
+ // A BroadcastExchangeExec that has been materialized won't be materialized again, so we
+ // should not reset its metrics. Otherwise, we would lose the metrics collected in the
+ // broadcast job.
+ }
+
@transient
private lazy val promise = Promise[broadcast.Broadcast[Any]]()
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/EnsureRequirements.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/EnsureRequirements.scala
index de5c3aaa4fe4d..a0fc4b65fdbf3 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/EnsureRequirements.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/exchange/EnsureRequirements.scala
@@ -20,7 +20,7 @@ package org.apache.spark.sql.execution.exchange
import scala.collection.mutable
import scala.collection.mutable.ArrayBuffer
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.plans._
@@ -374,6 +374,26 @@ case class EnsureRequirements(
}
}
+ /**
+ * Whether partial clustering can be applied to a given child query plan. This is true if the plan
+ * consists only of a sequence of unary nodes where each node does not use the scan's key-grouped
+ * partitioning to satisfy its required distribution. Otherwise, partial clustering could be
+ * applied to a key-grouped partitioning unrelated to this join.
+ */
+ private def canApplyPartialClusteredDistribution(plan: SparkPlan): Boolean = {
+ !plan.exists {
+ // Unary nodes are safe as long as they don't have a required distribution (for example, a
+ // project or filter). If they have a required distribution, then we should assume that this
+ // plan can't be partially clustered (since the key-grouped partitioning may be needed to
+ // satisfy a distribution unrelated to this join).
+ case u if u.children.length == 1 =>
+ u.requiredChildDistribution.head != UnspecifiedDistribution
+ // Only allow a non-unary node if it's a leaf node - key-grouped partitionings under other
+ // binary nodes (like another JOIN) aren't safe to partially cluster.
+ case other => other.children.nonEmpty
+ }
+ }
+
/**
* Checks whether two children, `left` and `right`, of a join operator have compatible
* `KeyGroupedPartitioning`, and can benefit from storage-partitioned join.
@@ -490,9 +510,16 @@ case class EnsureRequirements(
// whether partially clustered distribution can be applied. For instance, the
// optimization cannot be applied to a left outer join, where the left hand
// side is chosen as the side to replicate partitions according to stats.
+ // Similarly, the partially clustered distribution cannot be applied if the
+ // partially clustered side must use the scan's key-grouped partitioning to
+ // satisfy some unrelated required distribution in its plan (for example, for an aggregate
+ // or window function), as this will give incorrect results (for example, duplicate
+ // row_number() values).
// Otherwise, query result could be incorrect.
- val canReplicateLeft = canReplicateLeftSide(joinType)
- val canReplicateRight = canReplicateRightSide(joinType)
+ val canReplicateLeft = canReplicateLeftSide(joinType) &&
+ canApplyPartialClusteredDistribution(right)
+ val canReplicateRight = canReplicateRightSide(joinType) &&
+ canApplyPartialClusteredDistribution(left)
if (!canReplicateLeft && !canReplicateRight) {
logInfo(log"Skipping partially clustered distribution as it cannot be applied for " +
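A minimal sketch of the check performed by the new canApplyPartialClusteredDistribution, using toy plan classes rather than Spark's SparkPlan (all names here are illustrative only): a side qualifies when only unary nodes with no required distribution sit between the join and the leaf scan.

// Hedged sketch, not Spark classes: a toy plan tree mirroring the traversal above.
sealed trait ToyPlan { def children: Seq[ToyPlan]; def requiresDistribution: Boolean }
case object Scan extends ToyPlan { val children = Nil; val requiresDistribution = false }
case class Unary(child: ToyPlan, requiresDistribution: Boolean) extends ToyPlan {
  val children = Seq(child)
}
case class Join(left: ToyPlan, right: ToyPlan) extends ToyPlan {
  val children = Seq(left, right); val requiresDistribution = false
}

def exists(p: ToyPlan)(f: ToyPlan => Boolean): Boolean =
  f(p) || p.children.exists(c => exists(c)(f))

// Mirrors the rule above: only unary nodes with no required distribution may sit
// between the join and the scan.
def canPartiallyCluster(plan: ToyPlan): Boolean = !exists(plan) {
  case u if u.children.length == 1 => u.requiresDistribution // e.g. an aggregate or window
  case other => other.children.nonEmpty                      // another join below is not safe
}

Under this predicate, a project or filter over the scan keeps the side eligible, while a node that requires a distribution (an aggregate or window) or another join below it does not.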
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/CartesianProductExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/CartesianProductExec.scala
index 8a996bce251c7..8065decb0dffe 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/CartesianProductExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/CartesianProductExec.scala
@@ -36,11 +36,13 @@ class UnsafeCartesianRDD(
left : RDD[UnsafeRow],
right : RDD[UnsafeRow],
inMemoryBufferThreshold: Int,
- spillThreshold: Int)
+ spillThreshold: Int,
+ spillSizeThreshold: Long)
extends CartesianRDD[UnsafeRow, UnsafeRow](left.sparkContext, left, right) {
override def compute(split: Partition, context: TaskContext): Iterator[(UnsafeRow, UnsafeRow)] = {
- val rowArray = new ExternalAppendOnlyUnsafeRowArray(inMemoryBufferThreshold, spillThreshold)
+ val rowArray = new ExternalAppendOnlyUnsafeRowArray(inMemoryBufferThreshold, spillThreshold,
+ spillSizeThreshold)
val partition = split.asInstanceOf[CartesianPartition]
rdd2.iterator(partition.s2, context).foreach(rowArray.add)
@@ -81,7 +83,8 @@ case class CartesianProductExec(
leftResults,
rightResults,
conf.cartesianProductExecBufferInMemoryThreshold,
- conf.cartesianProductExecBufferSpillThreshold)
+ conf.cartesianProductExecBufferSpillThreshold,
+ conf.cartesianProductExecBufferSizeSpillThreshold)
pair.mapPartitionsWithIndexInternal { (index, iter) =>
val joiner = GenerateUnsafeRowJoiner.create(left.schema, right.schema)
val filtered = if (condition.isDefined) {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledHashJoinExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledHashJoinExec.scala
index 974f6f9e50c2e..97ca74aee30c0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledHashJoinExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledHashJoinExec.scala
@@ -65,14 +65,35 @@ case class ShuffledHashJoinExec(
case _ => super.outputOrdering
}
+ private def validCondForIgnoreDupKey(cond: Expression): Boolean = {
+ // To ignore duplicate keys on the build side, the join condition must satisfy:
+ // 1) any subtree that is a semantic match to a build-side key is accepted as a whole, and
+ // 2) outside any subtree that is a semantic match to a build-side key,
+ // all attributes must come from the stream side.
+ val buildKeysSet = ExpressionSet(buildKeys)
+ val streamedOutputAttrs = AttributeSet(streamedOutput)
+
+ def validCond(cond: Expression): Boolean = {
+ cond match {
+ // don't bother traversing any subtree that has a semantic match to a build key
+ case e: Expression if buildKeysSet.contains(e) => true
+ // all attributes (outside any subtree that matches a build key) should be
+ // from the stream side
+ case a: Attribute if !streamedOutputAttrs.contains(a) => false
+ case e: Expression =>
+ e.children.forall(validCond(_))
+ case _ => true
+ }
+ }
+
+ validCond(cond)
+ }
+
// Exposed for testing
@transient lazy val ignoreDuplicatedKey = joinType match {
case LeftExistence(_) =>
- // For building hash relation, ignore duplicated rows with same join keys if:
- // 1. Join condition is empty, or
- // 2. Join condition only references streamed attributes and build join keys.
- val streamedOutputAndBuildKeys = AttributeSet(streamedOutput ++ buildKeys)
- condition.forall(_.references.subsetOf(streamedOutputAndBuildKeys))
+ condition.forall(validCondForIgnoreDupKey(_))
case _ => false
}
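The relaxed ignoreDuplicatedKey rule above can be illustrated over a toy expression tree (hypothetical types, not Catalyst classes): a subtree that semantically matches a build-side key is accepted wholesale, and everything outside such subtrees may only reference stream-side attributes.

// Hedged sketch over a toy expression tree (not Catalyst).
sealed trait CondExpr { def children: Seq[CondExpr] }
case class CondAttr(name: String, fromStreamSide: Boolean) extends CondExpr { val children = Nil }
case class CondCall(op: String, children: Seq[CondExpr]) extends CondExpr

def validForIgnoreDupKey(cond: CondExpr, buildKeys: Set[CondExpr]): Boolean = cond match {
  // a subtree that matches a build-side key is accepted as a whole
  case e if buildKeys.contains(e) => true
  // outside matched subtrees, attributes must come from the stream side
  case a: CondAttr => a.fromStreamSide
  case e => e.children.forall(validForIgnoreDupKey(_, buildKeys))
}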
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledJoin.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledJoin.scala
index 60e5a7769a503..f363156c81e54 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledJoin.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/ShuffledJoin.scala
@@ -37,7 +37,7 @@ trait ShuffledJoin extends JoinCodegenSupport {
override def requiredChildDistribution: Seq[Distribution] = {
if (isSkewJoin) {
// We re-arrange the shuffle partitions to deal with skew join, and the new children
- // partitioning doesn't satisfy `HashClusteredDistribution`.
+ // partitioning doesn't satisfy `ClusteredDistribution`.
UnspecifiedDistribution :: UnspecifiedDistribution :: Nil
} else {
ClusteredDistribution(leftKeys) :: ClusteredDistribution(rightKeys) :: Nil
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinEvaluatorFactory.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinEvaluatorFactory.scala
index 57ca135407d4a..b4e52ba050b8d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinEvaluatorFactory.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinEvaluatorFactory.scala
@@ -34,6 +34,7 @@ class SortMergeJoinEvaluatorFactory(
output: Seq[Attribute],
inMemoryThreshold: Int,
spillThreshold: Int,
+ spillSizeThreshold: Long,
numOutputRows: SQLMetric,
spillSize: SQLMetric,
onlyBufferFirstMatchedRow: Boolean)
@@ -85,6 +86,7 @@ class SortMergeJoinEvaluatorFactory(
RowIterator.fromScala(rightIter),
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
spillSize,
cleanupResources)
private[this] val joinRow = new JoinedRow
@@ -130,6 +132,7 @@ class SortMergeJoinEvaluatorFactory(
bufferedIter = RowIterator.fromScala(rightIter),
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
spillSize,
cleanupResources)
val rightNullRow = new GenericInternalRow(right.output.length)
@@ -149,6 +152,7 @@ class SortMergeJoinEvaluatorFactory(
bufferedIter = RowIterator.fromScala(leftIter),
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
spillSize,
cleanupResources)
val leftNullRow = new GenericInternalRow(left.output.length)
@@ -185,6 +189,7 @@ class SortMergeJoinEvaluatorFactory(
RowIterator.fromScala(rightIter),
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
spillSize,
cleanupResources,
onlyBufferFirstMatchedRow)
@@ -222,6 +227,7 @@ class SortMergeJoinEvaluatorFactory(
RowIterator.fromScala(rightIter),
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
spillSize,
cleanupResources,
onlyBufferFirstMatchedRow)
@@ -266,6 +272,7 @@ class SortMergeJoinEvaluatorFactory(
RowIterator.fromScala(rightIter),
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
spillSize,
cleanupResources,
onlyBufferFirstMatchedRow)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinExec.scala
index 8d49b1558d687..39387ebbb7ee3 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/SortMergeJoinExec.scala
@@ -103,6 +103,10 @@ case class SortMergeJoinExec(
conf.sortMergeJoinExecBufferSpillThreshold
}
+ private def getSpillSizeThreshold: Long = {
+ conf.sortMergeJoinExecBufferSpillSizeThreshold
+ }
+
// Flag to only buffer first matched row, to avoid buffering unnecessary rows.
private val onlyBufferFirstMatchedRow = (joinType, condition) match {
case (LeftExistence(_), None) => true
@@ -121,6 +125,7 @@ case class SortMergeJoinExec(
val numOutputRows = longMetric("numOutputRows")
val spillSize = longMetric("spillSize")
val spillThreshold = getSpillThreshold
+ val spillSizeThreshold = getSpillSizeThreshold
val inMemoryThreshold = getInMemoryThreshold
val evaluatorFactory = new SortMergeJoinEvaluatorFactory(
leftKeys,
@@ -132,6 +137,7 @@ case class SortMergeJoinExec(
output,
inMemoryThreshold,
spillThreshold,
+ spillSizeThreshold,
numOutputRows,
spillSize,
onlyBufferFirstMatchedRow
@@ -222,11 +228,13 @@ case class SortMergeJoinExec(
val clsName = classOf[ExternalAppendOnlyUnsafeRowArray].getName
val spillThreshold = getSpillThreshold
+ val spillSizeThreshold = getSpillSizeThreshold
val inMemoryThreshold = getInMemoryThreshold
// Inline mutable state since not many join operations in a task
val matches = ctx.addMutableState(clsName, "matches",
- v => s"$v = new $clsName($inMemoryThreshold, $spillThreshold);", forceInline = true)
+ v => s"$v = new $clsName($inMemoryThreshold, $spillThreshold, ${spillSizeThreshold}L);",
+ forceInline = true)
// Copy the streamed keys as class members so they could be used in next function call.
val matchedKeyVars = copyKeys(ctx, streamedKeyVars)
@@ -1044,6 +1052,7 @@ case class SortMergeJoinExec(
* @param inMemoryThreshold Threshold for number of rows guaranteed to be held in memory by
* internal buffer
* @param spillThreshold Threshold for number of rows to be spilled by internal buffer
+ * @param spillSizeThreshold Threshold for size of rows to be spilled by internal buffer
* @param eagerCleanupResources the eager cleanup function to be invoked when no join row found
* @param onlyBufferFirstMatch [[bufferMatchingRows]] should buffer only the first matching row
*/
@@ -1055,6 +1064,7 @@ private[joins] class SortMergeJoinScanner(
bufferedIter: RowIterator,
inMemoryThreshold: Int,
spillThreshold: Int,
+ spillSizeThreshold: Long,
spillSize: SQLMetric,
eagerCleanupResources: () => Unit,
onlyBufferFirstMatch: Boolean = false) {
@@ -1069,7 +1079,7 @@ private[joins] class SortMergeJoinScanner(
private[this] var matchJoinKey: InternalRow = _
/** Buffered rows from the buffered side of the join. This is empty if there are no matches. */
private[this] val bufferedMatches: ExternalAppendOnlyUnsafeRowArray =
- new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold)
+ new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold, spillSizeThreshold)
// At the end of the task, update the task's spill size for buffered side.
TaskContext.get().addTaskCompletionListener[Unit](_ => {
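The new spillSizeThreshold is threaded alongside the existing row-count spillThreshold into ExternalAppendOnlyUnsafeRowArray. A hedged sketch of the dual-threshold idea, with a deliberately simplified buffer rather than the real class:

// Hedged sketch: spill when either the number of buffered rows or their total size
// exceeds its threshold (the real buffer also has an in-memory row threshold).
class DualThresholdBuffer(spillRowThreshold: Int, spillSizeThreshold: Long) {
  private val rows = scala.collection.mutable.ArrayBuffer.empty[Array[Byte]]
  private var totalSize = 0L

  def add(row: Array[Byte]): Unit = {
    rows += row
    totalSize += row.length
    if (rows.length >= spillRowThreshold || totalSize >= spillSizeThreshold) {
      spill()
    }
  }

  private def spill(): Unit = {
    // in the real implementation this hands the rows to an external sorter on disk
    rows.clear()
    totalSize = 0L
  }
}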
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/StoragePartitionJoinParams.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/StoragePartitionJoinParams.scala
new file mode 100644
index 0000000000000..a28eafc5cae5b
--- /dev/null
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/joins/StoragePartitionJoinParams.scala
@@ -0,0 +1,48 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution.joins
+
+import java.util.Objects
+
+import org.apache.spark.sql.catalyst.InternalRow
+import org.apache.spark.sql.catalyst.expressions.Expression
+import org.apache.spark.sql.connector.catalog.functions.Reducer
+
+case class StoragePartitionJoinParams(
+ keyGroupedPartitioning: Option[Seq[Expression]] = None,
+ joinKeyPositions: Option[Seq[Int]] = None,
+ commonPartitionValues: Option[Seq[(InternalRow, Int)]] = None,
+ reducers: Option[Seq[Option[Reducer[_, _]]]] = None,
+ applyPartialClustering: Boolean = false,
+ replicatePartitions: Boolean = false) {
+ override def equals(other: Any): Boolean = other match {
+ case other: StoragePartitionJoinParams =>
+ this.commonPartitionValues == other.commonPartitionValues &&
+ this.replicatePartitions == other.replicatePartitions &&
+ this.applyPartialClustering == other.applyPartialClustering &&
+ this.joinKeyPositions == other.joinKeyPositions
+ case _ =>
+ false
+ }
+
+ override def hashCode(): Int = Objects.hash(
+ joinKeyPositions: Option[Seq[Int]],
+ commonPartitionValues: Option[Seq[(InternalRow, Int)]],
+ applyPartialClustering: java.lang.Boolean,
+ replicatePartitions: java.lang.Boolean)
+}
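Note that equals and hashCode above intentionally ignore keyGroupedPartitioning and reducers, so two parameter sets that differ only in those fields compare equal. A small usage sketch with made-up field values:

// Hypothetical field values, for illustration only.
def sketchEquality(): Unit = {
  val a = StoragePartitionJoinParams(
    keyGroupedPartitioning = Some(Seq.empty),
    joinKeyPositions = Some(Seq(0, 1)),
    applyPartialClustering = true)
  val b = StoragePartitionJoinParams(
    keyGroupedPartitioning = None,   // differs from `a`, but is not part of equals()
    joinKeyPositions = Some(Seq(0, 1)),
    applyPartialClustering = true)
  assert(a == b && a.hashCode == b.hashCode)
}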
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/metric/SQLMetrics.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/metric/SQLMetrics.scala
index 065c8db7ac6f9..13f4d7926bea8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/metric/SQLMetrics.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/metric/SQLMetrics.scala
@@ -221,4 +221,19 @@ object SQLMetrics {
SparkListenerDriverAccumUpdates(executionId.toLong, metrics.map(m => m.id -> m.value)))
}
}
+
+ /**
+ * Measures the time taken by the function `f` in nanoseconds and adds it to the provided metric.
+ *
+ * @param metric SQLMetric to record the time taken.
+ * @param f Function/Codeblock to execute and measure.
+ * @return The result of the function `f`.
+ */
+ def withTimingNs[T](metric: SQLMetric)(f: => T): T = {
+ val startTime = System.nanoTime()
+ val result = f
+ val endTime = System.nanoTime()
+ metric.add(endTime - startTime)
+ result
+ }
}
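A hedged usage sketch for the new helper; buildTimeNs is assumed to be a nanosecond-based timing SQLMetric owned by the caller, and expensiveStep is a stand-in for the work being measured:

// Hedged sketch: wrap a block so its elapsed time (in nanoseconds) is added to the metric.
def timedBuild(buildTimeNs: SQLMetric)(expensiveStep: () => Long): Long = {
  SQLMetrics.withTimingNs(buildTimeNs) {
    expensiveStep()   // the elapsed nanoseconds of this block are accumulated into buildTimeNs
  }
}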
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/objects.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/objects.scala
index ca7836992aacb..015872d98c372 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/objects.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/objects.scala
@@ -39,7 +39,7 @@ import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.python.BatchIterator
import org.apache.spark.sql.execution.r.ArrowRRunner
-import org.apache.spark.sql.execution.streaming.GroupStateImpl
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming.GroupStateTimeout
import org.apache.spark.sql.types._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/AggregateInPandasExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowAggregatePythonExec.scala
similarity index 84%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/python/AggregateInPandasExec.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowAggregatePythonExec.scala
index 26871b68dde80..d6cc350e485a8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/AggregateInPandasExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowAggregatePythonExec.scala
@@ -21,7 +21,7 @@ import java.io.File
import scala.collection.mutable.ArrayBuffer
-import org.apache.spark.{JobArtifactSet, SparkEnv, TaskContext}
+import org.apache.spark.{JobArtifactSet, SparkEnv, SparkException, TaskContext}
import org.apache.spark.api.python.{ChainedPythonFunctions, PythonEvalType}
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
@@ -35,19 +35,28 @@ import org.apache.spark.sql.types.{DataType, StructField, StructType}
import org.apache.spark.util.Utils
/**
- * Physical node for aggregation with group aggregate Pandas UDF.
+ * Physical node for aggregation with group aggregate vectorized UDF.
+ * Following eval types are supported:
+ *
+ *
+ * <ul>
+ * <li>SQL_GROUPED_AGG_ARROW_UDF for Arrow UDF</li>
+ * <li>SQL_GROUPED_AGG_PANDAS_UDF for Pandas UDF</li>
+ * </ul>
*
* This plan works by sending the necessary (projected) input grouped data as Arrow record batches
* to the python worker, the python worker invokes the UDF and sends the results to the executor,
* finally the executor evaluates any post-aggregation expressions and join the result with the
* grouped key.
*/
-case class AggregateInPandasExec(
+case class ArrowAggregatePythonExec(
groupingExpressions: Seq[NamedExpression],
aggExpressions: Seq[AggregateExpression],
resultExpressions: Seq[NamedExpression],
- child: SparkPlan)
- extends UnaryExecNode with PythonSQLMetrics {
+ child: SparkPlan,
+ evalType: Int) extends UnaryExecNode with PythonSQLMetrics {
+ if (!supportedPythonEvalTypes.contains(evalType)) {
+ throw SparkException.internalError(s"Unexpected eval type $evalType")
+ }
override val output: Seq[Attribute] = resultExpressions.map(_.toAttribute)
@@ -173,7 +182,7 @@ case class AggregateInPandasExec(
val columnarBatchIter = new ArrowPythonWithNamedArgumentRunner(
pyFuncs,
- PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF,
+ evalType,
argMetas,
aggInputSchema,
sessionLocalTimeZone,
@@ -206,13 +215,33 @@ case class AggregateInPandasExec(
case Some(sessionExpression) =>
val inMemoryThreshold = conf.windowExecBufferInMemoryThreshold
val spillThreshold = conf.windowExecBufferSpillThreshold
+ val spillSizeThreshold = conf.windowExecBufferSpillSizeThreshold
new UpdatingSessionsIterator(iter, groupingWithoutSessionExpressions, sessionExpression,
- child.output, inMemoryThreshold, spillThreshold)
+ child.output, inMemoryThreshold, spillThreshold, spillSizeThreshold)
case None => iter
}
newIter
}
+
+ private def supportedPythonEvalTypes: Array[Int] =
+ Array(
+ PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF,
+ PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF)
+}
+
+object ArrowAggregatePythonExec {
+ def apply(
+ groupingExpressions: Seq[NamedExpression],
+ aggExpressions: Seq[AggregateExpression],
+ resultExpressions: Seq[NamedExpression],
+ child: SparkPlan): ArrowAggregatePythonExec = {
+ val evalTypes = aggExpressions.map(_.aggregateFunction.asInstanceOf[PythonUDAF].evalType)
+ assert(evalTypes.distinct.size == 1,
+ "All aggregate functions must have the same eval type in ArrowAggregatePythonExec")
+ new ArrowAggregatePythonExec(
+ groupingExpressions, aggExpressions, resultExpressions, child, evalTypes.head)
+ }
}
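The companion apply above derives the node's eval type from its aggregate expressions and requires that they all agree. A standalone sketch of that consistency check with toy types (not Catalyst classes):

// Hedged sketch with hypothetical types.
case class AggUDF(name: String, evalType: Int)

def resolveEvalType(aggs: Seq[AggUDF]): Int = {
  val evalTypes = aggs.map(_.evalType).distinct
  assert(evalTypes.size == 1, s"All aggregate functions must share one eval type, got $evalTypes")
  evalTypes.head
}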
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonExec.scala
index 9ec454731e4a6..92236ca42b2db 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonExec.scala
@@ -19,8 +19,8 @@ package org.apache.spark.sql.execution.python
import scala.jdk.CollectionConverters._
-import org.apache.spark.{JobArtifactSet, TaskContext}
-import org.apache.spark.api.python.ChainedPythonFunctions
+import org.apache.spark.{JobArtifactSet, SparkException, TaskContext}
+import org.apache.spark.api.python.{ChainedPythonFunctions, PythonEvalType}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.errors.QueryExecutionErrors
@@ -28,6 +28,7 @@ import org.apache.spark.sql.execution.SparkPlan
import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.sql.execution.python.EvalPythonExec.ArgumentMetadata
import org.apache.spark.sql.types.{StructType, UserDefinedType}
+import org.apache.spark.sql.types.DataType.equalsIgnoreCompatibleCollation
/**
* Grouped a iterator into batches.
@@ -59,11 +60,26 @@ private[spark] class BatchIterator[T](iter: Iterator[T], batchSize: Int)
}
/**
- * A physical plan that evaluates a [[PythonUDF]].
+ * A physical plan that evaluates a vectorized UDF.
+ * Following eval types are supported:
+ *
+ * <ul>
+ * <li>SQL_ARROW_BATCHED_UDF for Arrow Optimized Python UDF</li>
+ * <li>SQL_SCALAR_ARROW_UDF for Scalar Arrow UDF</li>
+ * <li>SQL_SCALAR_ARROW_ITER_UDF for Scalar Iterator Arrow UDF</li>
+ * <li>SQL_SCALAR_PANDAS_UDF for Scalar Pandas UDF</li>
+ * <li>SQL_SCALAR_PANDAS_ITER_UDF for Scalar Iterator Pandas UDF</li>
+ * </ul>
+ *
*/
-case class ArrowEvalPythonExec(udfs: Seq[PythonUDF], resultAttrs: Seq[Attribute], child: SparkPlan,
- evalType: Int)
- extends EvalPythonExec with PythonSQLMetrics {
+case class ArrowEvalPythonExec(
+ udfs: Seq[PythonUDF],
+ resultAttrs: Seq[Attribute],
+ child: SparkPlan,
+ evalType: Int) extends EvalPythonExec with PythonSQLMetrics {
+ if (!supportedPythonEvalTypes.contains(evalType)) {
+ throw SparkException.internalError(s"Unexpected eval type $evalType")
+ }
private[this] val jobArtifactUUID = JobArtifactSet.getCurrentJobArtifactState.map(_.uuid)
@@ -84,6 +100,14 @@ case class ArrowEvalPythonExec(udfs: Seq[PythonUDF], resultAttrs: Seq[Attribute]
override protected def withNewChildInternal(newChild: SparkPlan): SparkPlan =
copy(child = newChild)
+
+ private def supportedPythonEvalTypes: Array[Int] =
+ Array(
+ PythonEvalType.SQL_ARROW_BATCHED_UDF,
+ PythonEvalType.SQL_SCALAR_ARROW_UDF,
+ PythonEvalType.SQL_SCALAR_ARROW_ITER_UDF,
+ PythonEvalType.SQL_SCALAR_PANDAS_UDF,
+ PythonEvalType.SQL_SCALAR_PANDAS_ITER_UDF)
}
class ArrowEvalPythonEvaluatorFactory(
@@ -128,7 +152,7 @@ class ArrowEvalPythonEvaluatorFactory(
columnarBatchIter.flatMap { batch =>
val actualDataTypes = (0 until batch.numCols()).map(i => batch.column(i).dataType())
- if (outputTypes != actualDataTypes) {
+ if (!equalsIgnoreCompatibleCollation(outputTypes, actualDataTypes)) {
throw QueryExecutionErrors.arrowDataTypeMismatchError(
"pandas_udf()", outputTypes, actualDataTypes)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonUDTFExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonUDTFExec.scala
index d7106403a3880..ae1982ecec20e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonUDTFExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowEvalPythonUDTFExec.scala
@@ -25,7 +25,8 @@ import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.SparkPlan
import org.apache.spark.sql.execution.python.EvalPythonExec.ArgumentMetadata
-import org.apache.spark.sql.types.StructType
+import org.apache.spark.sql.types.{StructType, UserDefinedType}
+import org.apache.spark.sql.types.DataType.equalsIgnoreCompatibleCollation
import org.apache.spark.sql.vectorized.{ArrowColumnVector, ColumnarBatch}
/**
@@ -61,7 +62,9 @@ case class ArrowEvalPythonUDTFExec(
val batchIter = if (batchSize > 0) new BatchIterator(iter, batchSize) else Iterator(iter)
- val outputTypes = resultAttrs.map(_.dataType)
+ val outputTypes = resultAttrs.map(_.dataType.transformRecursively {
+ case udt: UserDefinedType[_] => udt.sqlType
+ })
val columnarBatchIter = new ArrowPythonUDTFRunner(
udtf,
@@ -82,7 +85,7 @@ case class ArrowEvalPythonUDTFExec(
val actualDataTypes = (0 until flattenedBatch.numCols()).map(
i => flattenedBatch.column(i).dataType())
- if (outputTypes != actualDataTypes) {
+ if (!equalsIgnoreCompatibleCollation(outputTypes, actualDataTypes)) {
throw QueryExecutionErrors.arrowDataTypeMismatchError(
"Python UDTF", outputTypes, actualDataTypes)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonRunner.scala
index 9a9fb574b87fb..70d2b17de2e72 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonRunner.scala
@@ -49,6 +49,8 @@ abstract class BaseArrowPythonRunner(
override val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
override val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
override val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ override val tracebackDumpIntervalSeconds: Long =
+ SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
override val errorOnDuplicatedFieldNames: Boolean = true
@@ -131,7 +133,15 @@ object ArrowPythonRunner {
val legacyPandasConversion = Seq(
SQLConf.PYTHON_TABLE_UDF_LEGACY_PANDAS_CONVERSION_ENABLED.key ->
conf.legacyPandasConversion.toString)
+ val legacyPandasConversionUDF = Seq(
+ SQLConf.PYTHON_UDF_LEGACY_PANDAS_CONVERSION_ENABLED.key ->
+ conf.legacyPandasConversionUDF.toString)
+ val intToDecimalCoercion = Seq(
+ SQLConf.PYTHON_UDF_PANDAS_INT_TO_DECIMAL_COERCION_ENABLED.key ->
+ conf.getConf(SQLConf.PYTHON_UDF_PANDAS_INT_TO_DECIMAL_COERCION_ENABLED, false).toString)
Map(timeZoneConf ++ pandasColsByName ++ arrowSafeTypeCheck ++
- arrowAyncParallelism ++ useLargeVarTypes ++ legacyPandasConversion: _*)
+ arrowAyncParallelism ++ useLargeVarTypes ++
+ intToDecimalCoercion ++
+ legacyPandasConversion ++ legacyPandasConversionUDF: _*)
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonUDTFRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonUDTFRunner.scala
index ae875c777b434..c081787b52095 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonUDTFRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowPythonUDTFRunner.scala
@@ -48,6 +48,20 @@ class ArrowPythonUDTFRunner(
with BasicPythonArrowOutput {
override protected def writeUDF(dataOut: DataOutputStream): Unit = {
+ // For arrow-optimized Python UDTFs (@udtf(useArrow=True)), we need to write
+ // the schema to the worker to support UDT (user-defined type).
+ // Currently, UDT is not supported in PyArrow native UDTFs (arrow_udf).
+ if (evalType == PythonEvalType.SQL_ARROW_TABLE_UDF) {
+ PythonWorkerUtils.writeUTF(schema.json, dataOut)
+ }
+ // Write the table argument offsets for Arrow UDTFs.
+ else if (evalType == PythonEvalType.SQL_ARROW_UDTF) {
+ val tableArgOffsets = argMetas.collect {
+ case ArgumentMetadata(offset, _, isTableArg) if isTableArg => offset
+ }
+ dataOut.writeInt(tableArgOffsets.length)
+ tableArgOffsets.foreach(dataOut.writeInt(_))
+ }
PythonUDTFRunner.writeUDTF(dataOut, udtf, argMetas)
}
@@ -58,6 +72,8 @@ class ArrowPythonUDTFRunner(
override val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
override val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
override val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ override val tracebackDumpIntervalSeconds: Long =
+ SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
override val errorOnDuplicatedFieldNames: Boolean = true
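The SQL_ARROW_UDTF branch in writeUDF above sends the table-argument offsets as a length-prefixed list of ints. A self-contained sketch of that wire format using plain Java streams (the offset values are made up):

import java.io.{ByteArrayOutputStream, DataOutputStream}

// Hedged sketch: length-prefixed list of table-argument offsets, mirroring the branch above.
object OffsetWireFormatSketch {
  def main(args: Array[String]): Unit = {
    val buffer = new ByteArrayOutputStream()
    val dataOut = new DataOutputStream(buffer)
    val tableArgOffsets = Seq(0, 2)               // hypothetical offsets
    dataOut.writeInt(tableArgOffsets.length)      // number of table arguments
    tableArgOffsets.foreach(dataOut.writeInt(_))  // one int per offset
    dataOut.flush()
    // The worker side reads an int count followed by that many int offsets.
  }
}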
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/WindowInPandasEvaluatorFactory.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowWindowPythonEvaluatorFactory.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/python/WindowInPandasEvaluatorFactory.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowWindowPythonEvaluatorFactory.scala
index e7fc9c7391af4..92ed9ff9de456 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/WindowInPandasEvaluatorFactory.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowWindowPythonEvaluatorFactory.scala
@@ -23,7 +23,7 @@ import scala.collection.mutable.ArrayBuffer
import scala.jdk.CollectionConverters._
import org.apache.spark.{JobArtifactSet, PartitionEvaluator, PartitionEvaluatorFactory, SparkEnv, TaskContext}
-import org.apache.spark.api.python.{ChainedPythonFunctions, PythonEvalType}
+import org.apache.spark.api.python.ChainedPythonFunctions
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeReference, BoundReference, EmptyRow, Expression, JoinedRow, NamedArgumentExpression, NamedExpression, PythonFuncExpression, PythonUDAF, SortOrder, SpecificInternalRow, UnsafeProjection, UnsafeRow, WindowExpression}
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
@@ -37,11 +37,12 @@ import org.apache.spark.sql.types.{DataType, IntegerType, StructField, StructTyp
import org.apache.spark.util.ArrayImplicits._
import org.apache.spark.util.Utils
-class WindowInPandasEvaluatorFactory(
+class ArrowWindowPythonEvaluatorFactory(
val windowExpression: Seq[NamedExpression],
val partitionSpec: Seq[Expression],
val orderSpec: Seq[SortOrder],
val childOutput: Seq[Attribute],
+ val evalType: Int,
val spillSize: SQLMetric,
pythonMetrics: Map[String, SQLMetric],
profiler: Option[String])
@@ -67,7 +68,7 @@ class WindowInPandasEvaluatorFactory(
private object BoundedWindow extends WindowBoundType("bounded")
- private val windowBoundTypeConf = "pandas_window_bound_types"
+ private val windowBoundTypeConf = "window_bound_types"
private def collectFunctions(
udf: PythonFuncExpression): ((ChainedPythonFunctions, Long), Seq[Expression]) = {
@@ -148,6 +149,7 @@ class WindowInPandasEvaluatorFactory(
private val inMemoryThreshold = conf.windowExecBufferInMemoryThreshold
private val spillThreshold = conf.windowExecBufferSpillThreshold
+ private val spillSizeThreshold = conf.windowExecBufferSpillSizeThreshold
private val sessionLocalTimeZone = conf.sessionLocalTimeZone
private val largeVarTypes = conf.arrowUseLargeVarTypes
@@ -286,7 +288,8 @@ class WindowInPandasEvaluatorFactory(
// Manage the current partition.
val buffer: ExternalAppendOnlyUnsafeRowArray =
- new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold)
+ new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold,
+ spillSizeThreshold)
var bufferIterator: Iterator[UnsafeRow] = _
val indexRow =
@@ -362,7 +365,7 @@ class WindowInPandasEvaluatorFactory(
val windowFunctionResult = new ArrowPythonWithNamedArgumentRunner(
pyFuncs,
- PythonEvalType.SQL_WINDOW_AGG_PANDAS_UDF,
+ evalType,
argMetas,
pythonInputSchema,
sessionLocalTimeZone,
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/WindowInPandasExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowWindowPythonExec.scala
similarity index 74%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/python/WindowInPandasExec.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowWindowPythonExec.scala
index 294bcdadc2b20..c8259c10dbd93 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/WindowInPandasExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ArrowWindowPythonExec.scala
@@ -17,6 +17,8 @@
package org.apache.spark.sql.execution.python
+import org.apache.spark.SparkException
+import org.apache.spark.api.python.PythonEvalType
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
@@ -26,6 +28,12 @@ import org.apache.spark.sql.execution.window._
/**
* This class calculates and outputs windowed aggregates over the rows in a single partition.
+ * Following eval types are supported:
+ *
+ * <ul>
+ * <li>SQL_WINDOW_AGG_ARROW_UDF for Arrow UDF</li>
+ * <li>SQL_WINDOW_AGG_PANDAS_UDF for Pandas UDF</li>
+ * </ul>
*
* This is similar to [[WindowExec]]. The main difference is that this node does not compute
* any window aggregation values. Instead, it computes the lower and upper bound for each window
@@ -61,7 +69,7 @@ import org.apache.spark.sql.execution.window._
* Unbounded window takes only input columns.
* (2) Bounded window evaluates the udf once per input row.
* Unbounded window evaluates the udf once per window partition.
- * This is controlled by Python runner conf "pandas_window_bound_types"
+ * This is controlled by Python runner conf "window_bound_types"
*
* The logic to compute window bounds is delegated to [[WindowFunctionFrame]] and shared with
* [[WindowExec]]
@@ -69,23 +77,28 @@ import org.apache.spark.sql.execution.window._
* Note this doesn't support partial aggregation and all aggregation is computed from the entire
* window.
*/
-case class WindowInPandasExec(
+case class ArrowWindowPythonExec(
windowExpression: Seq[NamedExpression],
partitionSpec: Seq[Expression],
orderSpec: Seq[SortOrder],
- child: SparkPlan)
- extends WindowExecBase with PythonSQLMetrics {
+ child: SparkPlan,
+ evalType: Int) extends WindowExecBase with PythonSQLMetrics {
+ if (!supportedPythonEvalTypes.contains(evalType)) {
+ throw SparkException.internalError(s"Unexpected eval type $evalType")
+ }
+
override lazy val metrics: Map[String, SQLMetric] = pythonMetrics ++ Map(
"spillSize" -> SQLMetrics.createSizeMetric(sparkContext, "spill size")
)
protected override def doExecute(): RDD[InternalRow] = {
val evaluatorFactory =
- new WindowInPandasEvaluatorFactory(
+ new ArrowWindowPythonEvaluatorFactory(
windowExpression,
partitionSpec,
orderSpec,
child.output,
+ evalType,
longMetric("spillSize"),
pythonMetrics,
conf.pythonUDFProfiler)
@@ -101,6 +114,26 @@ case class WindowInPandasExec(
}
}
- override protected def withNewChildInternal(newChild: SparkPlan): WindowInPandasExec =
+ override protected def withNewChildInternal(newChild: SparkPlan): ArrowWindowPythonExec =
copy(child = newChild)
+
+ private def supportedPythonEvalTypes: Array[Int] =
+ Array(
+ PythonEvalType.SQL_WINDOW_AGG_ARROW_UDF,
+ PythonEvalType.SQL_WINDOW_AGG_PANDAS_UDF)
+}
+
+object ArrowWindowPythonExec {
+ def apply(
+ windowExpression: Seq[NamedExpression],
+ partitionSpec: Seq[Expression],
+ orderSpec: Seq[SortOrder],
+ child: SparkPlan): ArrowWindowPythonExec = {
+ val evalTypes = windowExpression.flatMap(w => WindowFunctionType.pythonEvalType(w))
+ assert(evalTypes.nonEmpty,
+ "Cannot extract eval type from PythonUDAFs in ArrowWindowPythonExec")
+ assert(evalTypes.distinct.size == 1,
+ "All window functions must have the same eval type in ArrowWindowPythonExec")
+ ArrowWindowPythonExec(windowExpression, partitionSpec, orderSpec, child, evalTypes.head)
+ }
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/AttachDistributedSequenceExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/AttachDistributedSequenceExec.scala
index a8a6fa97c52a9..e27bde38a6f5f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/AttachDistributedSequenceExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/AttachDistributedSequenceExec.scala
@@ -18,7 +18,6 @@
package org.apache.spark.sql.execution.python
import org.apache.spark.internal.LogKeys.{RDD_ID, SPARK_PLAN_ID}
-import org.apache.spark.internal.MDC
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/BatchEvalPythonUDTFExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/BatchEvalPythonUDTFExec.scala
index c0dcb77817420..a1358c9cd7746 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/BatchEvalPythonUDTFExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/BatchEvalPythonUDTFExec.scala
@@ -120,7 +120,7 @@ object PythonUDTFRunner {
// Write the argument types of the UDTF.
dataOut.writeInt(argMetas.length)
argMetas.foreach {
- case ArgumentMetadata(offset, name) =>
+ case ArgumentMetadata(offset, name, _) =>
dataOut.writeInt(offset)
name match {
case Some(name) =>
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/CoGroupedArrowPythonRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/CoGroupedArrowPythonRunner.scala
index 27d6f7dc1c66b..8b160accd7a4d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/CoGroupedArrowPythonRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/CoGroupedArrowPythonRunner.scala
@@ -62,6 +62,8 @@ class CoGroupedArrowPythonRunner(
override val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
override val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
override val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ override val tracebackDumpIntervalSeconds: Long =
+ SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
override val hideTraceback: Boolean = SQLConf.get.pysparkHideTraceback
override val simplifiedTraceback: Boolean = SQLConf.get.pysparkSimplifiedTraceback
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonExec.scala
index af6769cfbb9d7..0c366b1280b41 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonExec.scala
@@ -28,8 +28,9 @@ object EvalPythonExec {
*
* @param offset the offset of the argument
* @param name the name of the argument if it's a `NamedArgumentExpression`
+ * @param isTableArg whether this argument is a table argument
*/
- case class ArgumentMetadata(offset: Int, name: Option[String])
+ case class ArgumentMetadata(offset: Int, name: Option[String], isTableArg: Boolean = false)
}
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonUDTFExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonUDTFExec.scala
index 41a99693443e5..3cb9431fed6f6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonUDTFExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvalPythonUDTFExec.scala
@@ -68,7 +68,9 @@ trait EvalPythonUDTFExec extends UnaryExecNode {
// flatten all the arguments
val allInputs = new ArrayBuffer[Expression]
val dataTypes = new ArrayBuffer[DataType]
- val argMetas = udtf.children.map { e =>
+ val argMetas = udtf.children.zip(
+ udtf.tableArguments.getOrElse(Seq.fill(udtf.children.length)(false))
+ ).map { case (e: Expression, isTableArg: Boolean) =>
val (key, value) = e match {
case NamedArgumentExpression(key, value) =>
(Some(key), value)
@@ -76,11 +78,11 @@ trait EvalPythonUDTFExec extends UnaryExecNode {
(None, e)
}
if (allInputs.exists(_.semanticEquals(value))) {
- ArgumentMetadata(allInputs.indexWhere(_.semanticEquals(value)), key)
+ ArgumentMetadata(allInputs.indexWhere(_.semanticEquals(value)), key, isTableArg)
} else {
allInputs += value
dataTypes += value.dataType
- ArgumentMetadata(allInputs.length - 1, key)
+ ArgumentMetadata(allInputs.length - 1, key, isTableArg)
}
}.toArray
val projection = MutableProjection.create(allInputs.toSeq, child.output)
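The change above threads a per-argument isTableArg flag through the same loop that deduplicates inputs and assigns offsets. A standalone sketch of that offset assignment with toy types, where semantic equality is reduced to plain equality:

import scala.collection.mutable.ArrayBuffer

// Hedged sketch with hypothetical types: each argument gets an offset into the
// deduplicated input list, and carries a table-argument flag along with it.
case class ToyArgMeta(offset: Int, name: Option[String], isTableArg: Boolean)

def buildArgMetas(
    args: Seq[(Option[String], String, Boolean)]): (Seq[String], Seq[ToyArgMeta]) = {
  val allInputs = new ArrayBuffer[String]
  val metas = args.map { case (name, value, isTableArg) =>
    val existing = allInputs.indexOf(value)
    if (existing >= 0) {
      ToyArgMeta(existing, name, isTableArg)          // reuse the offset of an equal input
    } else {
      allInputs += value
      ToyArgMeta(allInputs.length - 1, name, isTableArg)
    }
  }
  (allInputs.toSeq, metas)
}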
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvaluatePython.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvaluatePython.scala
index fd7ccb2189bff..5d117a67e6bee 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvaluatePython.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/EvaluatePython.scala
@@ -36,7 +36,8 @@ import org.apache.spark.unsafe.types.{UTF8String, VariantVal}
object EvaluatePython {
def needConversionInPython(dt: DataType): Boolean = dt match {
- case DateType | TimestampType | TimestampNTZType | VariantType | _: DayTimeIntervalType => true
+ case DateType | TimestampType | TimestampNTZType | VariantType | _: DayTimeIntervalType
+ | _: TimeType => true
case _: StructType => true
case _: UserDefinedType[_] => true
case ArrayType(elementType, _) => needConversionInPython(elementType)
@@ -78,7 +79,7 @@ object EvaluatePython {
case (d: Decimal, _) => d.toJavaBigDecimal
- case (s: UTF8String, StringType) => s.toString
+ case (s: UTF8String, _: StringType) => s.toString
case (other, _) => other
}
@@ -138,7 +139,7 @@ object EvaluatePython {
case c: Int => c
}
- case TimestampType | TimestampNTZType | _: DayTimeIntervalType => (obj: Any) =>
+ case TimestampType | TimestampNTZType | _: DayTimeIntervalType | _: TimeType => (obj: Any) =>
nullSafeConvert(obj) {
case c: Long => c
// Py4J serializes values between MIN_INT and MAX_INT as Ints, not Longs
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ExtractPythonUDFs.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ExtractPythonUDFs.scala
index a42e5d3e6c972..1407e020353f0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ExtractPythonUDFs.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/ExtractPythonUDFs.scala
@@ -22,7 +22,7 @@ import scala.collection.mutable.ArrayBuffer
import org.apache.spark.SparkException
import org.apache.spark.api.python.PythonEvalType
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.REASON
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
@@ -169,16 +169,63 @@ object ExtractPythonUDFs extends Rule[LogicalPlan] with Logging {
e.exists(PythonUDF.isScalarPythonUDF)
}
+ /**
+ * Return true if we should extract the current expression, together with all of its current
+ * children (the UDF expression and all others), into a logical node.
+ * The children of the expression can themselves be UDF expressions; this is nested chaining.
+ * If child UDF expressions were already extracted before, then this will just extract
+ * the current UDF expression, so they will end up in separate logical nodes. The child
+ * expressions will have been transformed to Attribute expressions referencing the child plan
+ * node's output.
+ *
+ * Return false if there is no single continuous chain of UDFs that can be extracted:
+ * - if there are other expressions in between, return false. In the
+ * example below, the caller will have to extract bar(baz()) separately first:
+ * Query: foo(1 + bar(baz()))
+ * Plan:
+ * - PythonUDF (foo)
+ * - Project
+ * - PythonUDF (bar)
+ * - PythonUDF (baz)
+ * - if the eval types of the UDF expressions in the chain differ, return false.
+ * - if a UDF has more than one child, e.g. foo(bar(), baz()), return false
+ * If we return false here, the expectation is that the recursive calls of
+ * collectEvaluableUDFsFromExpressions will then visit the children and extract them first to
+ * separate nodes.
+ */
@scala.annotation.tailrec
- private def canEvaluateInPython(e: PythonUDF): Boolean = {
+ private def shouldExtractUDFExpressionTree(e: PythonUDF): Boolean = {
e.children match {
- // single PythonUDF child could be chained and evaluated in Python
- case Seq(u: PythonUDF) => correctEvalType(e) == correctEvalType(u) && canEvaluateInPython(u)
+ case Seq(child: PythonUDF) => correctEvalType(e) == correctEvalType(child) &&
+ shouldExtractUDFExpressionTree(child)
// Python UDF can't be evaluated directly in JVM
case children => !children.exists(hasScalarPythonUDF)
}
}
+ /**
+ * We use the following terminology:
+ * - chaining is the act of combining multiple UDFs into a single logical node. This can be
+ * accomplished in different cases, for example:
+ * - parallel chaining: if the UDFs are siblings, e.g., foo(x), bar(x),
+ * where multiple independent UDFs are evaluated together over the same input
+ * - nested chaining: if the UDFs are nested, e.g., foo(bar(...)),
+ * where the output of one UDF feeds into the next in a sequential pipeline
+ *
+ * collectEvaluableUDFsFromExpressions returns a list of UDF expressions that can be planned
+ * together into one plan node. collectEvaluableUDFsFromExpressions will be called multiple times
+ * by recursive calls of extract(plan), until no more evaluable UDFs are found.
+ *
+ * As an example, consider the following expression tree:
+ * udf1(udf2(udf3(x)), udf4(x)), where all UDFs are PythonUDFs of the same eval type.
+ * We can only fuse UDFs of the same eval type, and never UDFs of SQL_SCALAR_PANDAS_ITER_UDF.
+ * The following udf expressions will be returned:
+ * - First, we will return Seq(udf3, udf4), as these two UDFs must be evaluated first.
+ * We return both in one Seq, as it is possible to do parallel fusing for udf3 and udf4.
+ * - As we can only chain UDFs with exactly one child, we will not fuse udf2 with its children.
+ * But we can chain udf1 and udf2, so a later call to collectEvaluableUDFsFromExpressions will
+ * return Seq(udf1, udf2).
+ */
private def collectEvaluableUDFsFromExpressions(expressions: Seq[Expression]): Seq[PythonUDF] = {
// If first UDF is SQL_SCALAR_PANDAS_ITER_UDF or SQL_SCALAR_ARROW_ITER_UDF,
// then only return this UDF,
@@ -187,7 +234,7 @@ object ExtractPythonUDFs extends Rule[LogicalPlan] with Logging {
var firstVisitedScalarUDFEvalType: Option[Int] = None
- def canChainUDF(evalType: Int): Boolean = {
+ def canChainWithParallelUDFs(evalType: Int): Boolean = {
if (evalType == PythonEvalType.SQL_SCALAR_PANDAS_ITER_UDF ||
evalType == PythonEvalType.SQL_SCALAR_ARROW_ITER_UDF) {
false
@@ -197,12 +244,14 @@ object ExtractPythonUDFs extends Rule[LogicalPlan] with Logging {
}
def collectEvaluableUDFs(expr: Expression): Seq[PythonUDF] = expr match {
- case udf: PythonUDF if PythonUDF.isScalarPythonUDF(udf) && canEvaluateInPython(udf)
+ case udf: PythonUDF if PythonUDF.isScalarPythonUDF(udf)
+ && shouldExtractUDFExpressionTree(udf)
&& firstVisitedScalarUDFEvalType.isEmpty =>
firstVisitedScalarUDFEvalType = Some(correctEvalType(udf))
Seq(udf)
- case udf: PythonUDF if PythonUDF.isScalarPythonUDF(udf) && canEvaluateInPython(udf)
- && canChainUDF(correctEvalType(udf)) =>
+ case udf: PythonUDF if PythonUDF.isScalarPythonUDF(udf)
+ && shouldExtractUDFExpressionTree(udf)
+ && canChainWithParallelUDFs(correctEvalType(udf)) =>
Seq(udf)
case e => e.children.flatMap(collectEvaluableUDFs)
}
@@ -357,6 +406,10 @@ object ExtractPythonUDTFs extends Rule[LogicalPlan] {
BatchEvalPythonUDTF(func, g.requiredChildOutput, g.generatorOutput, child)
case PythonEvalType.SQL_ARROW_TABLE_UDF =>
ArrowEvalPythonUDTF(func, g.requiredChildOutput, g.generatorOutput, child, func.evalType)
+ case PythonEvalType.SQL_ARROW_UDTF =>
+ ArrowEvalPythonUDTF(func, g.requiredChildOutput, g.generatorOutput, child, func.evalType)
+ case _ =>
+ throw SparkException.internalError(s"Unsupported UDTF eval type: ${func.evalType}")
}
}
}
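A toy sketch of the extraction predicate documented above, using hypothetical UDF tree classes rather than Catalyst expressions: a UDF tree is extractable as one unit only if it is a straight chain of UDFs with a single eval type and no UDFs are hidden below non-UDF children.

// Hedged sketch over a toy expression tree, illustrating which UDF trees qualify.
sealed trait ToyExpr { def children: Seq[ToyExpr] }
case class ToyUDF(name: String, evalType: Int, children: Seq[ToyExpr]) extends ToyExpr
case class Other(children: Seq[ToyExpr]) extends ToyExpr

def containsUDF(e: ToyExpr): Boolean = e.isInstanceOf[ToyUDF] || e.children.exists(containsUDF)

// A UDF tree is extractable as one unit if it is a straight chain of UDFs with the same
// eval type, and no UDFs sit below any non-UDF child.
def extractableAsOneUnit(u: ToyUDF): Boolean = u.children match {
  case Seq(child: ToyUDF) => child.evalType == u.evalType && extractableAsOneUnit(child)
  case children => !children.exists(containsUDF)
}

In this sketch, udf1 in udf1(udf2(udf3(x)), udf4(x)) is not extractable as a single unit because it has two UDF children, while the sub-chain udf2(udf3(x)) is.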
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonPlannerRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonPlannerRunner.scala
index 897b520f0b1ab..200a92f3dc3c6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonPlannerRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonPlannerRunner.scala
@@ -30,7 +30,7 @@ import net.razorvine.pickle.Pickler
import org.apache.spark.{JobArtifactSet, SparkEnv, SparkException}
import org.apache.spark.api.python.{BasePythonRunner, PythonFunction, PythonWorker, PythonWorkerUtils, SpecialLengths}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.config.BUFFER_SIZE
import org.apache.spark.internal.config.Python._
import org.apache.spark.sql.internal.SQLConf
@@ -57,6 +57,7 @@ abstract class PythonPlannerRunner[T](func: PythonFunction) extends Logging {
val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ val tracebackDumpIntervalSeconds: Long = SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
val hideTraceback: Boolean = SQLConf.get.pysparkHideTraceback
val simplifiedTraceback: Boolean = SQLConf.get.pysparkSimplifiedTraceback
val workerMemoryMb = SQLConf.get.pythonPlannerExecMemory
@@ -88,6 +89,9 @@ abstract class PythonPlannerRunner[T](func: PythonFunction) extends Logging {
if (faultHandlerEnabled) {
envVars.put("PYTHON_FAULTHANDLER_DIR", faultHandlerLogDir.toString)
}
+ if (tracebackDumpIntervalSeconds > 0L) {
+ envVars.put("PYTHON_TRACEBACK_DUMP_INTERVAL_SECONDS", tracebackDumpIntervalSeconds.toString)
+ }
envVars.put("SPARK_JOB_ARTIFACT_UUID", jobArtifactUUID.getOrElse("default"))
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonUDFRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonUDFRunner.scala
index 4baddcd4d9e77..8ff7e57d9421e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonUDFRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/PythonUDFRunner.scala
@@ -48,6 +48,8 @@ abstract class BasePythonUDFRunner(
override val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
override val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
override val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ override val tracebackDumpIntervalSeconds: Long =
+ SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
override val bufferSize: Int = SQLConf.get.getConf(SQLConf.PYTHON_UDF_BUFFER_SIZE)
override val batchSizeForPythonUDF: Int =
@@ -191,7 +193,7 @@ object PythonUDFRunner {
funcs.zip(argMetas).foreach { case ((chained, resultId), metas) =>
dataOut.writeInt(metas.length)
metas.foreach {
- case ArgumentMetadata(offset, name) =>
+ case ArgumentMetadata(offset, name, _) =>
dataOut.writeInt(offset)
name match {
case Some(name) =>
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/UserDefinedPythonFunction.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/UserDefinedPythonFunction.scala
index c43cbad7c395f..5ab0d259d83c4 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/UserDefinedPythonFunction.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/UserDefinedPythonFunction.scala
@@ -25,7 +25,7 @@ import net.razorvine.pickle.Pickler
import org.apache.spark.api.python.{PythonEvalType, PythonFunction, PythonWorkerUtils, SpecialLengths}
import org.apache.spark.sql.{Column, TableArg}
-import org.apache.spark.sql.catalyst.expressions.{Alias, Ascending, Descending, Expression, FunctionTableSubqueryArgumentExpression, NamedArgumentExpression, NullsFirst, NullsLast, PythonUDAF, PythonUDF, PythonUDTF, PythonUDTFAnalyzeResult, PythonUDTFSelectedExpression, SortOrder, UnresolvedPolymorphicPythonUDTF}
+import org.apache.spark.sql.catalyst.expressions.{Alias, Ascending, Descending, Expression, FunctionTableSubqueryArgumentExpression, NamedArgumentExpression, NullsFirst, NullsLast, PythonUDAF, PythonUDF, PythonUDTF, PythonUDTFAnalyzeResult, PythonUDTFSelectedExpression, SortOrder, UnresolvedPolymorphicPythonUDTF, UnresolvedTableArgPlanId}
import org.apache.spark.sql.catalyst.parser.ParserInterface
import org.apache.spark.sql.catalyst.plans.logical.{Generate, LogicalPlan, NamedParametersSupport, OneRowRelation}
import org.apache.spark.sql.classic.{DataFrame, Dataset, SparkSession}
@@ -50,7 +50,8 @@ case class UserDefinedPythonFunction(
|| pythonEvalType ==PythonEvalType.SQL_ARROW_BATCHED_UDF
|| pythonEvalType == PythonEvalType.SQL_SCALAR_PANDAS_UDF
|| pythonEvalType == PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF
- || pythonEvalType == PythonEvalType.SQL_SCALAR_ARROW_UDF) {
+ || pythonEvalType == PythonEvalType.SQL_SCALAR_ARROW_UDF
+ || pythonEvalType == PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF) {
/*
* Check if the named arguments:
* - don't have duplicated names
@@ -61,8 +62,9 @@ case class UserDefinedPythonFunction(
throw QueryCompilationErrors.namedArgumentsNotSupported(name)
}
- if (pythonEvalType == PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF) {
- PythonUDAF(name, func, dataType, e, udfDeterministic)
+ if (pythonEvalType == PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF
+ || pythonEvalType == PythonEvalType.SQL_GROUPED_AGG_ARROW_UDF) {
+ PythonUDAF(name, func, dataType, e, udfDeterministic, pythonEvalType)
} else {
PythonUDF(name, func, dataType, e, pythonEvalType, udfDeterministic)
}
@@ -121,6 +123,16 @@ case class UserDefinedPythonTableFunction(
*/
NamedParametersSupport.splitAndCheckNamedArguments(exprs, name)
+ // Check which argument is a table argument here since it will be replaced with
+ // `UnresolvedAttribute` to construct lateral join.
+ val tableArgs = exprs.map {
+ case _: FunctionTableSubqueryArgumentExpression => true
+ case _: UnresolvedTableArgPlanId => true
+ case NamedArgumentExpression(_, _: FunctionTableSubqueryArgumentExpression) => true
+ case NamedArgumentExpression(_, _: UnresolvedTableArgPlanId) => true
+ case _ => false
+ }
+
val udtf = returnType match {
case Some(rt) =>
PythonUDTF(
@@ -130,15 +142,9 @@ case class UserDefinedPythonTableFunction(
pickledAnalyzeResult = None,
children = exprs,
evalType = pythonEvalType,
- udfDeterministic = udfDeterministic)
+ udfDeterministic = udfDeterministic,
+ tableArguments = Some(tableArgs))
case _ =>
- // Check which argument is a table argument here since it will be replaced with
- // `UnresolvedAttribute` to construct lateral join.
- val tableArgs = exprs.map {
- case _: FunctionTableSubqueryArgumentExpression => true
- case NamedArgumentExpression(_, _: FunctionTableSubqueryArgumentExpression) => true
- case _ => false
- }
val runAnalyzeInPython = (func: PythonFunction, exprs: Seq[Expression]) => {
val runner =
new UserDefinedPythonTableFunctionAnalyzeRunner(name, func, exprs, tableArgs, parser)
@@ -150,7 +156,8 @@ case class UserDefinedPythonTableFunction(
children = exprs,
evalType = pythonEvalType,
udfDeterministic = udfDeterministic,
- resolveElementMetadata = runAnalyzeInPython)
+ resolveElementMetadata = runAnalyzeInPython,
+ tableArguments = Some(tableArgs))
}
Generate(
udtf,
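The tableArgs mask above is computed up front because table arguments are later replaced when constructing the lateral join. A hedged sketch of the mask computation over toy argument types (not Catalyst expressions):

// Hedged sketch: mark which call arguments are table arguments, including when they are
// wrapped in a named argument (hypothetical simplified types).
sealed trait ToyArg
case class TableSubquery(planId: Long) extends ToyArg
case class Named(name: String, value: ToyArg) extends ToyArg
case class Scalar(value: Any) extends ToyArg

def tableArgMask(args: Seq[ToyArg]): Seq[Boolean] = args.map {
  case _: TableSubquery => true
  case Named(_, _: TableSubquery) => true
  case _ => false
}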
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStatePythonRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStatePythonRunner.scala
index 0de937df05f4a..b6f6a4cbc30b6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStatePythonRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStatePythonRunner.scala
@@ -28,7 +28,6 @@ import org.json4s.jackson.JsonMethods._
import org.apache.spark.api.python._
import org.apache.spark.internal.LogKeys.CONFIG
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.Row
import org.apache.spark.sql.api.python.PythonSQLUtils
import org.apache.spark.sql.catalyst.InternalRow
@@ -39,7 +38,7 @@ import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.sql.execution.python.{PythonArrowInput, PythonArrowOutput, PythonUDFRunner}
import org.apache.spark.sql.execution.python.streaming.ApplyInPandasWithStatePythonRunner.{COUNT_COLUMN_SCHEMA_FROM_PYTHON_WORKER, InType, OutType, OutTypeForState, STATE_METADATA_SCHEMA_FROM_PYTHON_WORKER}
import org.apache.spark.sql.execution.python.streaming.ApplyInPandasWithStateWriter.STATE_METADATA_SCHEMA
-import org.apache.spark.sql.execution.streaming.GroupStateImpl
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types._
import org.apache.spark.sql.vectorized.{ArrowColumnVector, ColumnarBatch}
@@ -78,6 +77,8 @@ class ApplyInPandasWithStatePythonRunner(
override val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
override val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
override val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ override val tracebackDumpIntervalSeconds: Long =
+ SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
private val sqlConf = SQLConf.get
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStateWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStateWriter.scala
index 6bfa5440db37f..f55ca749112fb 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStateWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/ApplyInPandasWithStateWriter.scala
@@ -28,7 +28,7 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UnsafeRow}
import org.apache.spark.sql.execution.arrow.ArrowWriter
import org.apache.spark.sql.execution.arrow.ArrowWriter.createFieldWriter
-import org.apache.spark.sql.execution.streaming.GroupStateImpl
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl
import org.apache.spark.sql.types.{BinaryType, BooleanType, IntegerType, StringType, StructField, StructType}
import org.apache.spark.unsafe.types.UTF8String
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/FlatMapGroupsInPandasWithStateExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/FlatMapGroupsInPandasWithStateExec.scala
index e53bdae813d26..5b9b95ef413aa 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/FlatMapGroupsInPandasWithStateExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/FlatMapGroupsInPandasWithStateExec.scala
@@ -28,9 +28,10 @@ import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.execution.{GroupedIterator, SparkPlan, UnaryExecNode}
import org.apache.spark.sql.execution.python.ArrowPythonRunner
import org.apache.spark.sql.execution.python.PandasGroupUtils.resolveArgOffsets
-import org.apache.spark.sql.execution.streaming._
-import org.apache.spark.sql.execution.streaming.GroupStateImpl.NO_TIMESTAMP
-import org.apache.spark.sql.execution.streaming.state.FlatMapGroupsWithStateExecHelper.StateData
+import org.apache.spark.sql.execution.streaming.operators.stateful._
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.{FlatMapGroupsWithStateExecBase, GroupStateImpl}
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.FlatMapGroupsWithStateExecHelper.StateData
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl.NO_TIMESTAMP
import org.apache.spark.sql.execution.streaming.state.StateStore
import org.apache.spark.sql.streaming.{GroupStateTimeout, OutputMode}
import org.apache.spark.sql.types.StructType
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonForeachWriter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonForeachWriter.scala
index 04c51c859baca..01643af9cf30d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonForeachWriter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonForeachWriter.scala
@@ -102,6 +102,8 @@ class PythonForeachWriter(func: PythonFunction, schema: StructType)
override val faultHandlerEnabled: Boolean = SQLConf.get.pythonUDFWorkerFaulthandlerEnabled
override val idleTimeoutSeconds: Long = SQLConf.get.pythonUDFWorkerIdleTimeoutSeconds
override val killOnIdleTimeout: Boolean = SQLConf.get.pythonUDFWorkerKillOnIdleTimeout
+ override val tracebackDumpIntervalSeconds: Long =
+ SQLConf.get.pythonUDFWorkerTracebackDumpIntervalSeconds
override val hideTraceback: Boolean = SQLConf.get.pysparkHideTraceback
override val simplifiedTraceback: Boolean = SQLConf.get.pysparkSimplifiedTraceback
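
The runner changes above add a `tracebackDumpIntervalSeconds` knob, read from `SQLConf` next to the existing idle-timeout and faulthandler settings. A small sketch of the pattern (hypothetical trait and class names, not the real runner hierarchy): worker tuning options are exposed as overridable members and each runner binds them to configuration values at construction time.

```scala
// Sketch only: config-backed worker settings surfaced as overridable vals.
trait WorkerConf {                               // hypothetical trait
  def idleTimeoutSeconds: Long
  def killOnIdleTimeout: Boolean
  def tracebackDumpIntervalSeconds: Long         // the knob added in this change
}

final class SketchRunner(conf: Map[String, String]) extends WorkerConf {
  override val idleTimeoutSeconds: Long =
    conf.getOrElse("worker.idleTimeoutSeconds", "0").toLong
  override val killOnIdleTimeout: Boolean =
    conf.getOrElse("worker.killOnIdleTimeout", "false").toBoolean
  override val tracebackDumpIntervalSeconds: Long =
    conf.getOrElse("worker.tracebackDumpIntervalSeconds", "0").toLong
}
```
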
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonStreamingSourceRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonStreamingSourceRunner.scala
index 3979220618baa..5945b91084278 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonStreamingSourceRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/PythonStreamingSourceRunner.scala
@@ -28,7 +28,7 @@ import org.apache.arrow.vector.ipc.ArrowStreamReader
import org.apache.spark.SparkEnv
import org.apache.spark.api.python.{PythonFunction, PythonWorker, PythonWorkerFactory, PythonWorkerUtils, SpecialLengths}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.LogKeys.PYTHON_EXEC
import org.apache.spark.internal.config.BUFFER_SIZE
import org.apache.spark.internal.config.Python.PYTHON_AUTH_SOCKET_TIMEOUT
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkExec.scala
index b65d46fb16325..1b967af38b6db 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkExec.scala
@@ -35,8 +35,10 @@ import org.apache.spark.sql.execution.{CoGroupedIterator, SparkPlan}
import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.sql.execution.python.ArrowPythonRunner
import org.apache.spark.sql.execution.python.PandasGroupUtils.{executePython, groupAndProject, resolveArgOffsets}
-import org.apache.spark.sql.execution.streaming.{DriverStatefulProcessorHandleImpl, StatefulOperatorStateInfo, StatefulProcessorHandleImpl, TransformWithStateExecBase, TransformWithStateVariableInfo}
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper.StateStoreAwareZipPartitionsHelper
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperatorStateInfo, StatefulOperatorsUtils}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper.StateStoreAwareZipPartitionsHelper
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.{TransformWithStateExecBase, TransformWithStateVariableInfo}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.{DriverStatefulProcessorHandleImpl, StatefulProcessorHandleImpl}
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, RocksDBStateStoreProvider, StateSchemaValidationResult, StateStore, StateStoreColFamilySchema, StateStoreConf, StateStoreId, StateStoreOps, StateStoreProvider, StateStoreProviderId}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming.{OutputMode, TimeMode}
@@ -95,9 +97,9 @@ case class TransformWithStateInPySparkExec(
override def shortName: String = if (
userFacingDataType == TransformWithStateInPySpark.UserFacingDataType.PANDAS
) {
- "transformWithStateInPandasExec"
+ StatefulOperatorsUtils.TRANSFORM_WITH_STATE_IN_PANDAS_EXEC_OP_NAME
} else {
- "transformWithStateInPySparkExec"
+ StatefulOperatorsUtils.TRANSFORM_WITH_STATE_IN_PYSPARK_EXEC_OP_NAME
}
private val pythonUDF = functionExpr.asInstanceOf[PythonUDF]
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkPythonRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkPythonRunner.scala
index dffdaca1b835e..51dc179c901ab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkPythonRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkPythonRunner.scala
@@ -35,7 +35,7 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.sql.execution.python.{BasicPythonArrowOutput, PythonArrowInput, PythonUDFRunner}
import org.apache.spark.sql.execution.python.streaming.TransformWithStateInPySparkPythonRunner.{GroupedInType, InType}
-import org.apache.spark.sql.execution.streaming.{DriverStatefulProcessorHandleImpl, StatefulProcessorHandleImpl}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.{DriverStatefulProcessorHandleImpl, StatefulProcessorHandleImpl}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.vectorized.ColumnarBatch
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkStateServer.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkStateServer.scala
index 5c8a55edaffc1..4edeae132b47a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkStateServer.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/TransformWithStateInPySparkStateServer.scala
@@ -29,14 +29,15 @@ import org.apache.arrow.vector.VectorSchemaRoot
import org.apache.arrow.vector.ipc.ArrowStreamWriter
import org.apache.spark.SparkEnv
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.config.Python.PYTHON_UNIX_DOMAIN_SOCKET_ENABLED
import org.apache.spark.sql.{Encoders, Row}
import org.apache.spark.sql.api.python.PythonSQLUtils
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.parser.CatalystSqlParser
-import org.apache.spark.sql.execution.streaming.{ImplicitGroupingKeyTracker, StatefulProcessorHandleImpl, StatefulProcessorHandleImplBase, StatefulProcessorHandleState, StateVariableType}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateVariableType
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.{ImplicitGroupingKeyTracker, StatefulProcessorHandleImpl, StatefulProcessorHandleImplBase, StatefulProcessorHandleState}
import org.apache.spark.sql.execution.streaming.state.StateMessage.{HandleState, ImplicitGroupingKeyRequest, ListStateCall, MapStateCall, StatefulProcessorCall, StateRequest, StateResponse, StateResponseWithLongTypeVal, StateResponseWithMapIterator, StateResponseWithMapKeysOrValues, StateResponseWithStringTypeVal, StateResponseWithTimer, StateVariableRequest, TimerInfo, TimerRequest, TimerStateCallCommand, TimerValueRequest, UtilsRequest, ValueStateCall}
import org.apache.spark.sql.execution.streaming.state.StateMessage.KeyAndValuePair
import org.apache.spark.sql.execution.streaming.state.StateMessage.StateResponseWithListGet
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/benchmark/BenchmarkTransformWithStateInPySparkStateServer.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/benchmark/BenchmarkTransformWithStateInPySparkStateServer.scala
index 3cb9bfa24a536..5dc7d9733dcdc 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/benchmark/BenchmarkTransformWithStateInPySparkStateServer.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/python/streaming/benchmark/BenchmarkTransformWithStateInPySparkStateServer.scala
@@ -33,9 +33,7 @@ import org.apache.spark.sql.Encoder
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.execution.python.streaming.TransformWithStateInPySparkStateServer
-import org.apache.spark.sql.execution.streaming.ImplicitGroupingKeyTracker
-import org.apache.spark.sql.execution.streaming.QueryInfoImpl
-import org.apache.spark.sql.execution.streaming.StatefulProcessorHandleImplBase
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.{ImplicitGroupingKeyTracker, QueryInfoImpl, StatefulProcessorHandleImplBase}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming.ListState
import org.apache.spark.sql.streaming.MapState
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/r/ArrowRRunner.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/r/ArrowRRunner.scala
index aaf2f256273d3..fafe1fbe313ab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/r/ArrowRRunner.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/r/ArrowRRunner.scala
@@ -30,7 +30,7 @@ import org.apache.spark.TaskContext
import org.apache.spark.api.r._
import org.apache.spark.api.r.SpecialLengths
import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.execution.arrow.ArrowWriter
import org.apache.spark.sql.types.StructType
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ManifestFileCommitProtocol.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ManifestFileCommitProtocol.scala
index b382642eb6bf6..66e90ec689131 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ManifestFileCommitProtocol.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ManifestFileCommitProtocol.scala
@@ -25,11 +25,12 @@ import scala.collection.mutable.ArrayBuffer
import org.apache.hadoop.fs.Path
import org.apache.hadoop.mapreduce.{JobContext, TaskAttemptContext}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{BATCH_ID, PATH}
-import org.apache.spark.internal.io.FileCommitProtocol
+import org.apache.spark.internal.io.{FileCommitProtocol, FileNameSpec}
import org.apache.spark.internal.io.FileCommitProtocol.TaskCommitMessage
import org.apache.spark.sql.errors.QueryExecutionErrors
+import org.apache.spark.sql.execution.streaming.sinks.{FileStreamSinkLog, SinkFileStatus}
/**
* A [[FileCommitProtocol]] that tracks the list of valid files in a manifest file, used in
@@ -114,13 +115,13 @@ class ManifestFileCommitProtocol(jobId: String, path: String)
}
override def newTaskTempFile(
- taskContext: TaskAttemptContext, dir: Option[String], ext: String): String = {
+ taskContext: TaskAttemptContext, dir: Option[String], spec: FileNameSpec): String = {
// The file name looks like part-r-00000-2dd664f9-d2c4-4ffe-878f-c6c70c1fb0cb_00003.gz.parquet
// Note that %05d does not truncate the split number, so if we have more than 100000 tasks,
// the file name is fine and won't overflow.
val split = taskContext.getTaskAttemptID.getTaskID.getId
val uuid = UUID.randomUUID.toString
- val filename = f"part-$split%05d-$uuid$ext"
+ val filename = f"part-$split%05d-$uuid${spec.suffix}"
val file = dir.map { d =>
new Path(new Path(path, d), filename).toString
@@ -133,7 +134,7 @@ class ManifestFileCommitProtocol(jobId: String, path: String)
}
override def newTaskTempFileAbsPath(
- taskContext: TaskAttemptContext, absoluteDir: String, ext: String): String = {
+ taskContext: TaskAttemptContext, absoluteDir: String, spec: FileNameSpec): String = {
throw QueryExecutionErrors.addFilesWithAbsolutePathUnsupportedError(this.toString)
}
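
`newTaskTempFile` and `newTaskTempFileAbsPath` now receive a `FileNameSpec` instead of a bare extension string, and the part-file name is assembled from `spec.suffix`. A sketch of the filename assembly, using a stand-in case class with the same (prefix, suffix) shape rather than the real `FileNameSpec`:

```scala
import java.util.UUID

// Hypothetical stand-in mirroring the shape of the spec passed in above.
case class NameSpec(prefix: String, suffix: String)

def taskTempFileName(split: Int, spec: NameSpec): String = {
  val uuid = UUID.randomUUID.toString
  // %05d pads but never truncates, so split numbers beyond 99999 still work.
  f"part-$split%05d-$uuid${spec.suffix}"
}

// taskTempFileName(3, NameSpec("", ".gz.parquet"))
//   => "part-00003-<random uuid>.gz.parquet"
```
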
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingErrors.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingErrors.scala
new file mode 100644
index 0000000000000..98b8832ee2a82
--- /dev/null
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingErrors.scala
@@ -0,0 +1,42 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.spark.sql.execution.streaming
+
+import org.apache.spark.SparkException
+
+/**
+ * Object for grouping error messages from streaming query exceptions
+ */
+object StreamingErrors {
+ def cannotLoadCheckpointFileManagerClass(path: String, className: String, err: Throwable):
+ Throwable = {
+ new SparkException(
+ errorClass = "CANNOT_LOAD_CHECKPOINT_FILE_MANAGER.ERROR_LOADING_CLASS",
+ messageParameters = Map("path" -> path, "className" -> className, "msg" -> err.toString),
+ cause = err
+ )
+ }
+
+ def cannotLoadCheckpointFileManager(path: String, err: Throwable):
+ Throwable = {
+ new SparkException(
+ errorClass = "CANNOT_LOAD_CHECKPOINT_FILE_MANAGER.UNCATEGORIZED",
+ messageParameters = Map("path" -> path),
+ cause = err
+ )
+ }
+}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncCommitLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/AsyncCommitLog.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncCommitLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/AsyncCommitLog.scala
index 6db01624fd26b..116ea18326ef0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncCommitLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/AsyncCommitLog.scala
@@ -15,14 +15,14 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import java.io.OutputStream
import java.util.concurrent.{CompletableFuture, ConcurrentLinkedDeque, ThreadPoolExecutor}
import scala.jdk.CollectionConverters._
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.errors.QueryExecutionErrors
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncOffsetSeqLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/AsyncOffsetSeqLog.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncOffsetSeqLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/AsyncOffsetSeqLog.scala
index 54a8855b77cdb..18d18e61da475 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncOffsetSeqLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/AsyncOffsetSeqLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import java.io.OutputStream
import java.util.concurrent._
@@ -23,7 +23,7 @@ import java.util.concurrent.atomic.AtomicLong
import scala.jdk.CollectionConverters._
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.util.{Clock, SystemClock}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CheckpointFileManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/CheckpointFileManager.scala
similarity index 92%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CheckpointFileManager.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/CheckpointFileManager.scala
index 982cc13c40868..3d07483ba4dd1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CheckpointFileManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/CheckpointFileManager.scala
@@ -14,9 +14,10 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import java.io.{FileNotFoundException, OutputStream}
+import java.lang.reflect.InvocationTargetException
import java.util.{EnumSet, UUID}
import scala.util.control.NonFatal
@@ -26,10 +27,11 @@ import org.apache.hadoop.fs._
import org.apache.hadoop.fs.local.{LocalFs, RawLocalFs}
import org.apache.hadoop.fs.permission.FsPermission
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{FINAL_PATH, PATH, TEMP_PATH}
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager.RenameHelperMethods
+import org.apache.spark.sql.execution.streaming.StreamingErrors
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager.RenameHelperMethods
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.Utils
@@ -49,7 +51,7 @@ import org.apache.spark.util.Utils
*/
trait CheckpointFileManager {
- import org.apache.spark.sql.execution.streaming.CheckpointFileManager._
+ import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager._
/**
* Create a file and make its contents available atomically after the output stream is closed.
@@ -200,10 +202,19 @@ object CheckpointFileManager extends Logging {
val fileManagerClass = hadoopConf.get(
SQLConf.STREAMING_CHECKPOINT_FILE_MANAGER_CLASS.parent.key)
if (fileManagerClass != null) {
- return Utils.classForName(fileManagerClass)
- .getConstructor(classOf[Path], classOf[Configuration])
- .newInstance(path, hadoopConf)
- .asInstanceOf[CheckpointFileManager]
+ try {
+ return Utils.classForName(fileManagerClass)
+ .getConstructor(classOf[Path], classOf[Configuration])
+ .newInstance(path, hadoopConf)
+ .asInstanceOf[CheckpointFileManager]
+ } catch {
+ case e: InvocationTargetException if e.getCause != null =>
+ throw StreamingErrors.cannotLoadCheckpointFileManagerClass(path.toString,
+ fileManagerClass, e.getCause)
+ case NonFatal(e) =>
+ throw StreamingErrors.cannotLoadCheckpointFileManagerClass(path.toString,
+ fileManagerClass, e)
+ }
}
try {
// Try to create a manager based on `FileContext` because HDFS's `FileContext.rename()
@@ -218,6 +229,8 @@ object CheckpointFileManager extends Logging {
log"the implementation of FileSystem.rename() is not atomic, then the correctness " +
log"and fault-tolerance of your Structured Streaming is not guaranteed.")
new FileSystemBasedCheckpointFileManager(path, hadoopConf)
+ case NonFatal(e) =>
+ throw StreamingErrors.cannotLoadCheckpointFileManager(path.toString, e)
}
}
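
The `CheckpointFileManager` change above wraps the reflective construction of a user-configured manager class so that failures surface as the new `CANNOT_LOAD_CHECKPOINT_FILE_MANAGER` errors, unwrapping `InvocationTargetException` to reach the constructor's real cause. A minimal sketch of that general pattern, with a hypothetical `wrap` helper standing in for the `StreamingErrors` methods:

```scala
import java.lang.reflect.InvocationTargetException
import scala.util.control.NonFatal

// Sketch: when a user-supplied class is instantiated reflectively, its
// constructor's own failure arrives wrapped in InvocationTargetException,
// so unwrap getCause before converting it into a domain-specific exception.
def loadPlugin[T](className: String)(wrap: Throwable => Exception): T = {
  try {
    Class.forName(className)
      .getDeclaredConstructor()
      .newInstance()
      .asInstanceOf[T]
  } catch {
    case e: InvocationTargetException if e.getCause != null =>
      throw wrap(e.getCause)
    case NonFatal(e) =>
      throw wrap(e)
  }
}
```
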
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CommitLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/CommitLog.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CommitLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/CommitLog.scala
index f501b62b8a718..6892b6b535cf9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CommitLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/CommitLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import java.io.{InputStream, OutputStream}
import java.nio.charset.StandardCharsets._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/HDFSMetadataLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/HDFSMetadataLog.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/HDFSMetadataLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/HDFSMetadataLog.scala
index 423648f445904..6d35b1a8f8c00 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/HDFSMetadataLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/HDFSMetadataLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import java.io._
import java.nio.charset.StandardCharsets
@@ -24,17 +24,17 @@ import java.util.{Collections, LinkedHashMap => JLinkedHashMap}
import scala.jdk.CollectionConverters._
import scala.reflect.ClassTag
-import org.apache.commons.io.IOUtils
import org.apache.hadoop.fs._
import org.json4s.{Formats, NoTypeHints}
import org.json4s.jackson.Serialization
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.ArrayImplicits._
+import org.apache.spark.util.Utils
/**
@@ -191,7 +191,7 @@ class HDFSMetadataLog[T <: AnyRef : ClassTag](sparkSession: SparkSession, path:
throw new IllegalStateException(
s"Failed to read log file $batchMetadataFile. ${ise.getMessage}", ise)
} finally {
- IOUtils.closeQuietly(input)
+ Utils.closeQuietly(input)
}
} else {
throw QueryExecutionErrors.batchMetadataFileNotFoundError(batchMetadataFile)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/MetadataLog.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/MetadataLog.scala
index 4083d5d897afc..18c04e0b9b5db 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/MetadataLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
/**
* A general MetadataLog that supports the following features:
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataVersionUtil.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/MetadataVersionUtil.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataVersionUtil.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/MetadataVersionUtil.scala
index 854e36b5304a9..8d832c21287a5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataVersionUtil.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/MetadataVersionUtil.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import org.apache.spark.sql.errors.QueryExecutionErrors
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeq.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeq.scala
similarity index 93%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeq.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeq.scala
index a599f3bc66118..c1c3c379719a1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeq.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeq.scala
@@ -15,17 +15,20 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import org.json4s.{Formats, NoTypeHints}
import org.json4s.jackson.Serialization
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CONFIG, DEFAULT_VALUE, NEW_VALUE, OLD_VALUE, TIP}
import org.apache.spark.io.CompressionCodec
import org.apache.spark.sql.RuntimeConfig
import org.apache.spark.sql.connector.read.streaming.{Offset => OffsetV2, SparkDataStream}
-import org.apache.spark.sql.execution.streaming.state.{FlatMapGroupsWithStateExecHelper, StreamingAggregationStateManager, SymmetricHashJoinStateManager}
+import org.apache.spark.sql.execution.streaming.operators.stateful.StreamingAggregationStateManager
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.FlatMapGroupsWithStateExecHelper
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.SymmetricHashJoinStateManager
+import org.apache.spark.sql.execution.streaming.runtime.{MultipleWatermarkPolicy, StreamProgress}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.SQLConf._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeqLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeqLog.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeqLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeqLog.scala
index 7e490ef4cd53d..816563b3f09fd 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/OffsetSeqLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/checkpointing/OffsetSeqLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.checkpointing
import java.io.{InputStream, OutputStream}
@@ -25,6 +25,7 @@ import scala.io.{Source => IOSource}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.connector.read.streaming.{Offset => OffsetV2}
+import org.apache.spark.sql.execution.streaming.runtime.SerializedOffset
/**
* This class is used to log offsets to persistent files in HDFS.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/console.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/console.scala
index 67585bdf20ce0..d8666e6740046 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/console.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/console.scala
@@ -19,8 +19,8 @@ package org.apache.spark.sql.execution.streaming
import java.util
-import org.apache.spark.sql._
-import org.apache.spark.sql.connector.catalog.{SupportsWrite, Table, TableCapability}
+import org.apache.spark.sql.{Column => _, _}
+import org.apache.spark.sql.connector.catalog.{Column, SupportsWrite, Table, TableCapability}
import org.apache.spark.sql.connector.write.{LogicalWriteInfo, SupportsTruncate, Write, WriteBuilder}
import org.apache.spark.sql.connector.write.streaming.StreamingWrite
import org.apache.spark.sql.execution.streaming.sources.ConsoleWrite
@@ -64,7 +64,7 @@ object ConsoleTable extends Table with SupportsWrite {
override def name(): String = "console"
- override def schema(): StructType = StructType(Nil)
+ override def columns(): Array[Column] = Array.empty
override def capabilities(): util.Set[TableCapability] = {
util.EnumSet.of(TableCapability.STREAMING_WRITE)
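
`ConsoleTable` now reports its (empty) schema through `columns()` rather than `schema()`. A short sketch of how a connector table's column array can be built, assuming the connector catalog `Column.create(name, dataType)` factory; the console sink itself just returns an empty array because it accepts whatever schema the query writes.

```scala
import org.apache.spark.sql.connector.catalog.Column
import org.apache.spark.sql.types.{LongType, StringType}

// Sketch (assumes Column.create is available in the connector catalog API):
// a sink with a fixed output would enumerate its columns explicitly.
val consoleColumns: Array[Column] = Array.empty

val exampleColumns: Array[Column] = Array(
  Column.create("timestamp", LongType),
  Column.create("value", StringType))
```
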
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousExecution.scala
index a13c00ee20576..51cd457fbc856 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousExecution.scala
@@ -26,7 +26,6 @@ import scala.collection.mutable.{Map => MutableMap}
import org.apache.spark.SparkEnv
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.expressions.{CurrentDate, CurrentTimestampLike, LocalTimestamp}
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.streaming.{StreamingRelationV2, WriteToStream}
@@ -40,6 +39,8 @@ import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors
import org.apache.spark.sql.execution.SQLExecution
import org.apache.spark.sql.execution.datasources.v2.{StreamingDataSourceV2Relation, StreamingDataSourceV2ScanRelation}
import org.apache.spark.sql.execution.streaming._
+import org.apache.spark.sql.execution.streaming.checkpointing.{CommitMetadata, OffsetSeq}
+import org.apache.spark.sql.execution.streaming.runtime.{AcceptsLatestSeenOffsetHandler, ACTIVE, ContinuousExecutionContext, IncrementalExecution, ProcessingTimeExecutor, RECONFIGURING, State, StreamExecution, StreamExecutionContext, TERMINATED, WatermarkPropagator}
import org.apache.spark.sql.streaming.Trigger
import org.apache.spark.util.ArrayImplicits._
import org.apache.spark.util.Clock
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousQueuedDataReader.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousQueuedDataReader.scala
index 398df496d15ff..d9eff62bcc986 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousQueuedDataReader.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousQueuedDataReader.scala
@@ -23,7 +23,7 @@ import java.util.concurrent.{ArrayBlockingQueue, TimeUnit}
import scala.util.control.NonFatal
import org.apache.spark.{SparkEnv, TaskContext}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.UnsafeProjection
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousRateStreamSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousRateStreamSource.scala
index 132d9a9d61e57..ef5eab951b605 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousRateStreamSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousRateStreamSource.scala
@@ -24,7 +24,7 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.util.DateTimeUtils
import org.apache.spark.sql.connector.read.InputPartition
import org.apache.spark.sql.connector.read.streaming.{ContinuousPartitionReader, ContinuousPartitionReaderFactory, ContinuousStream, Offset, PartitionOffset}
-import org.apache.spark.sql.execution.streaming.{RateStreamOffset, ValueRunTimeMsPair}
+import org.apache.spark.sql.execution.streaming.runtime.{RateStreamOffset, ValueRunTimeMsPair}
case class RateStreamPartitionOffset(
partition: Int, currentValue: Long, currentTimeMs: Long) extends PartitionOffset
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousTextSocketSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousTextSocketSource.scala
index 273ffa6aefb7b..c23e38a13efee 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousTextSocketSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousTextSocketSource.scala
@@ -29,7 +29,7 @@ import org.json4s.{DefaultFormats, Formats, NoTypeHints}
import org.json4s.jackson.Serialization
import org.apache.spark.SparkEnv
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{HOST, PORT}
import org.apache.spark.rpc.RpcEndpointRef
import org.apache.spark.sql.Encoders
@@ -38,7 +38,8 @@ import org.apache.spark.sql.catalyst.encoders.encoderFor
import org.apache.spark.sql.catalyst.expressions.{UnsafeProjection, UnsafeRow}
import org.apache.spark.sql.connector.read.InputPartition
import org.apache.spark.sql.connector.read.streaming.{ContinuousPartitionReader, ContinuousPartitionReaderFactory, ContinuousStream, Offset, PartitionOffset}
-import org.apache.spark.sql.execution.streaming.{Offset => _, _}
+import org.apache.spark.sql.execution.streaming.{Offset => _}
+import org.apache.spark.sql.execution.streaming.runtime.{ContinuousRecordEndpoint, ContinuousRecordPartitionOffset, GetRecord}
import org.apache.spark.sql.execution.streaming.sources.TextSocketReader
import org.apache.spark.sql.util.CaseInsensitiveStringMap
import org.apache.spark.util.RpcUtils
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousWriteRDD.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousWriteRDD.scala
index d5daa9a875f83..51399969df1b9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousWriteRDD.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/ContinuousWriteRDD.scala
@@ -18,7 +18,7 @@
package org.apache.spark.sql.execution.streaming.continuous
import org.apache.spark.{Partition, SparkEnv, TaskContext}
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.internal.LogKeys._
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/WriteToContinuousDataSourceExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/WriteToContinuousDataSourceExec.scala
index 42ce32e1bc674..8b5d6c580f105 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/WriteToContinuousDataSourceExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/continuous/WriteToContinuousDataSourceExec.scala
@@ -17,7 +17,7 @@
package org.apache.spark.sql.execution.streaming.continuous
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.catalyst.InternalRow
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/EventTimeWatermarkExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/EventTimeWatermarkExec.scala
similarity index 99%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/EventTimeWatermarkExec.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/EventTimeWatermarkExec.scala
index d25c4be0fb84a..03c8d70ec87f9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/EventTimeWatermarkExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/EventTimeWatermarkExec.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful
import java.util.UUID
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MergingSortWithSessionWindowStateIterator.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/MergingSortWithSessionWindowStateIterator.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MergingSortWithSessionWindowStateIterator.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/MergingSortWithSessionWindowStateIterator.scala
index a923ebd79889c..69577a1f74339 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MergingSortWithSessionWindowStateIterator.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/MergingSortWithSessionWindowStateIterator.scala
@@ -15,13 +15,13 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{Attribute, UnsafeProjection, UnsafeRow}
import org.apache.spark.sql.catalyst.expressions.codegen.GenerateUnsafeProjection
-import org.apache.spark.sql.execution.streaming.state.{ReadStateStore, StreamingSessionWindowStateManager}
+import org.apache.spark.sql.execution.streaming.state.ReadStateStore
/**
* This class technically does the merge sort between input rows and existing sessions in state,
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulOperatorPartitioning.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StatefulOperatorPartitioning.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulOperatorPartitioning.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StatefulOperatorPartitioning.scala
index 527349201574e..ed2941e3f2f4c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulOperatorPartitioning.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StatefulOperatorPartitioning.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful
import org.apache.spark.sql.catalyst.expressions.Expression
import org.apache.spark.sql.catalyst.plans.physical.{ClusteredDistribution, Distribution, StatefulOpClusteredDistribution}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StreamingAggregationStateManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StreamingAggregationStateManager.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StreamingAggregationStateManager.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StreamingAggregationStateManager.scala
index 97feb9b579af9..c7f7f388010da 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StreamingAggregationStateManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StreamingAggregationStateManager.scala
@@ -15,12 +15,13 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming.state
+package org.apache.spark.sql.execution.streaming.operators.stateful
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.expressions.{Attribute, UnsafeRow}
import org.apache.spark.sql.catalyst.expressions.codegen.{GenerateUnsafeProjection, GenerateUnsafeRowJoiner}
import org.apache.spark.sql.catalyst.types.DataTypeUtils
+import org.apache.spark.sql.execution.streaming.state.{ReadStateStore, StateStore, UnsafeRowPair}
import org.apache.spark.sql.types.StructType
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StreamingSessionWindowStateManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StreamingSessionWindowStateManager.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StreamingSessionWindowStateManager.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StreamingSessionWindowStateManager.scala
index 71df9dc65b419..a74b4aaf0da12 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StreamingSessionWindowStateManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/StreamingSessionWindowStateManager.scala
@@ -15,13 +15,14 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming.state
+package org.apache.spark.sql.execution.streaming.operators.stateful
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{Attribute, Literal, UnsafeProjection, UnsafeRow}
import org.apache.spark.sql.catalyst.expressions.codegen.GenerateUnsafeProjection
+import org.apache.spark.sql.execution.streaming.state.{ReadStateStore, StateStore, UnsafeRowPair}
import org.apache.spark.sql.types.{StructType, TimestampType}
import org.apache.spark.util.NextIterator
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FlatMapGroupsWithStateExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/FlatMapGroupsWithStateExec.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FlatMapGroupsWithStateExec.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/FlatMapGroupsWithStateExec.scala
index ebf08358c07bc..a0778fbfb6149 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FlatMapGroupsWithStateExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/FlatMapGroupsWithStateExec.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate
import java.util.concurrent.TimeUnit.NANOSECONDS
@@ -31,7 +31,8 @@ import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.catalyst.plans.physical.Distribution
import org.apache.spark.sql.execution._
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper._
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperatorPartitioning, StatefulOperatorStateInfo, StateStoreWriter, WatermarkSupport}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper._
import org.apache.spark.sql.execution.streaming.state._
import org.apache.spark.sql.streaming.{GroupStateTimeout, OutputMode}
import org.apache.spark.sql.streaming.GroupStateTimeout.NoTimeout
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/FlatMapGroupsWithStateExecHelper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/FlatMapGroupsWithStateExecHelper.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/FlatMapGroupsWithStateExecHelper.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/FlatMapGroupsWithStateExecHelper.scala
index b68c08b3ea5c6..280fcfc0ca1ca 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/FlatMapGroupsWithStateExecHelper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/FlatMapGroupsWithStateExecHelper.scala
@@ -15,13 +15,14 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming.state
+package org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.catalyst.types.DataTypeUtils.toAttributes
import org.apache.spark.sql.execution.ObjectOperator
-import org.apache.spark.sql.execution.streaming.GroupStateImpl.NO_TIMESTAMP
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl.NO_TIMESTAMP
+import org.apache.spark.sql.execution.streaming.state.StateStore
import org.apache.spark.sql.types._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/GroupStateImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/GroupStateImpl.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/GroupStateImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/GroupStateImpl.scala
index d4e93642b8164..1cab963802ca2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/GroupStateImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/flatmapgroupswithstate/GroupStateImpl.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate
import java.sql.Date
import java.util.concurrent.TimeUnit
@@ -28,7 +28,7 @@ import org.apache.spark.api.java.Optional
import org.apache.spark.sql.catalyst.plans.logical.{EventTimeTimeout, NoTimeout, ProcessingTimeTimeout}
import org.apache.spark.sql.catalyst.util.IntervalUtils
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.GroupStateImpl._
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl._
import org.apache.spark.sql.streaming.{GroupStateTimeout, TestGroupState}
import org.apache.spark.unsafe.types.UTF8String
import org.apache.spark.util.Utils
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingSymmetricHashJoinExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/StreamingSymmetricHashJoinExec.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingSymmetricHashJoinExec.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/StreamingSymmetricHashJoinExec.scala
index 7d71db8d8e4b9..ef37185ce4166 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingSymmetricHashJoinExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/StreamingSymmetricHashJoinExec.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.join
import java.util.concurrent.TimeUnit.NANOSECONDS
@@ -29,9 +29,10 @@ import org.apache.spark.sql.catalyst.plans.physical._
import org.apache.spark.sql.catalyst.types.DataTypeUtils
import org.apache.spark.sql.execution.{BinaryExecNode, SparkPlan}
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper._
+import org.apache.spark.sql.execution.streaming.operators.stateful.{SchemaValidationUtils, StatefulOperatorCustomMetric, StatefulOperatorCustomSumMetric, StatefulOperatorStateInfo, StatefulOperatorsUtils, StatefulOpStateStoreCheckpointInfo, StateStoreWriter, WatermarkSupport}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper._
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.SymmetricHashJoinStateManager.KeyToValuePair
import org.apache.spark.sql.execution.streaming.state._
-import org.apache.spark.sql.execution.streaming.state.SymmetricHashJoinStateManager.KeyToValuePair
import org.apache.spark.sql.internal.{SessionState, SQLConf}
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.{CompletionIterator, SerializableConfiguration}
@@ -236,7 +237,7 @@ case class StreamingSymmetricHashJoinExec(
case _ => throwBadJoinTypeException()
}
- override def shortName: String = "symmetricHashJoin"
+ override def shortName: String = StatefulOperatorsUtils.SYMMETRIC_HASH_JOIN_EXEC_OP_NAME
override val stateStoreNames: Seq[String] = _stateStoreNames
@@ -350,7 +351,7 @@ case class StreamingSymmetricHashJoinExec(
assert(stateInfo.isDefined, "State info not defined")
val checkpointIds = SymmetricHashJoinStateManager.getStateStoreCheckpointIds(
- partitionId, stateInfo.get, useVirtualColumnFamilies)
+ partitionId, stateInfo.get.stateStoreCkptIds, useVirtualColumnFamilies)
val inputSchema = left.output ++ right.output
val postJoinFilter =
@@ -362,12 +363,12 @@ case class StreamingSymmetricHashJoinExec(
new OneSideHashJoiner(
LeftSide, left.output, leftKeys, leftInputIter,
condition.leftSideOnly, postJoinFilter, stateWatermarkPredicates.left, partitionId,
- checkpointIds.left.keyToNumValues, checkpointIds.left.valueToNumKeys,
+ checkpointIds.left.keyToNumValues, checkpointIds.left.keyWithIndexToValue,
skippedNullValueCount, joinStateManagerStoreGenerator),
new OneSideHashJoiner(
RightSide, right.output, rightKeys, rightInputIter,
condition.rightSideOnly, postJoinFilter, stateWatermarkPredicates.right, partitionId,
- checkpointIds.right.keyToNumValues, checkpointIds.right.valueToNumKeys,
+ checkpointIds.right.keyToNumValues, checkpointIds.right.keyWithIndexToValue,
skippedNullValueCount, joinStateManagerStoreGenerator))
// Join one side input using the other side's buffered/state rows. Here is how it is done.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingSymmetricHashJoinHelper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/StreamingSymmetricHashJoinHelper.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingSymmetricHashJoinHelper.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/StreamingSymmetricHashJoinHelper.scala
index 497e71070a09a..7b02a43cd5a9f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingSymmetricHashJoinHelper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/StreamingSymmetricHashJoinHelper.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.join
import scala.reflect.ClassTag
@@ -26,7 +26,8 @@ import org.apache.spark.sql.catalyst.analysis.StreamingJoinHelper
import org.apache.spark.sql.catalyst.expressions.{And, Attribute, AttributeSet, BoundReference, Expression, NamedExpression, PredicateHelper}
import org.apache.spark.sql.catalyst.plans.logical.EventTimeWatermark._
import org.apache.spark.sql.execution.SparkPlan
-import org.apache.spark.sql.execution.streaming.WatermarkSupport.watermarkExpression
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperatorStateInfo, WatermarkSupport}
+import org.apache.spark.sql.execution.streaming.operators.stateful.WatermarkSupport.watermarkExpression
import org.apache.spark.sql.execution.streaming.state.{StateStoreCheckpointInfo, StateStoreCoordinatorRef, StateStoreProviderId}
@@ -323,15 +324,15 @@ object StreamingSymmetricHashJoinHelper extends Logging {
case class JoinerStateStoreCkptInfo(
keyToNumValues: StateStoreCheckpointInfo,
- valueToNumKeys: StateStoreCheckpointInfo)
+ keyWithIndexToValue: StateStoreCheckpointInfo)
case class JoinStateStoreCkptInfo(
left: JoinerStateStoreCkptInfo,
right: JoinerStateStoreCkptInfo)
case class JoinerStateStoreCheckpointId(
- keyToNumValues: Option[String],
- valueToNumKeys: Option[String])
+ keyToNumValues: Option[String],
+ keyWithIndexToValue: Option[String])
case class JoinStateStoreCheckpointId(
left: JoinerStateStoreCheckpointId,
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SymmetricHashJoinStateManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/SymmetricHashJoinStateManager.scala
similarity index 91%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SymmetricHashJoinStateManager.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/SymmetricHashJoinStateManager.scala
index 6ec197d7cc7b1..c0965747722e5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SymmetricHashJoinStateManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/join/SymmetricHashJoinStateManager.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming.state
+package org.apache.spark.sql.execution.streaming.operators.stateful.join
import java.util.Locale
@@ -24,15 +24,16 @@ import scala.annotation.tailrec
import org.apache.hadoop.conf.Configuration
import org.apache.spark.TaskContext
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{END_INDEX, START_INDEX, STATE_STORE_ID}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeReference, Expression, JoinedRow, Literal, SafeProjection, SpecificInternalRow, UnsafeProjection, UnsafeRow}
import org.apache.spark.sql.catalyst.types.DataTypeUtils.toAttributes
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.StatefulOperatorStateInfo
-import org.apache.spark.sql.execution.streaming.StatefulOpStateStoreCheckpointInfo
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper._
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorStateInfo
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOpStateStoreCheckpointInfo
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper._
+import org.apache.spark.sql.execution.streaming.state.{KeyStateEncoderSpec, NoPrefixKeyStateEncoderSpec, StateSchemaBroadcast, StateStore, StateStoreCheckpointInfo, StateStoreColFamilySchema, StateStoreConf, StateStoreErrors, StateStoreId, StateStoreMetrics, StateStoreProvider, StateStoreProviderId, SupportsFineGrainedReplay}
import org.apache.spark.sql.types.{BooleanType, LongType, StructField, StructType}
import org.apache.spark.util.NextIterator
@@ -439,7 +440,7 @@ abstract class SymmetricHashJoinStateManager(
* NOTE: this function is only intended for use in unit tests
* to simulate null values.
*/
- private[state] def updateNumValuesTestOnly(key: UnsafeRow, numValues: Long): Unit = {
+ private[streaming] def updateNumValuesTestOnly(key: UnsafeRow, numValues: Long): Unit = {
keyToNumValues.put(key, numValues)
}
@@ -528,7 +529,7 @@ abstract class SymmetricHashJoinStateManager(
* Helper class for representing data returned by [[KeyWithIndexToValueStore]].
* Designed for object reuse.
*/
- private[state] class KeyAndNumValues(var key: UnsafeRow = null, var numValue: Long = 0) {
+ private[join] class KeyAndNumValues(var key: UnsafeRow = null, var numValue: Long = 0) {
def withNew(newKey: UnsafeRow, newNumValues: Long): this.type = {
this.key = newKey
this.numValue = newNumValues
@@ -595,7 +596,7 @@ abstract class SymmetricHashJoinStateManager(
* Helper class for representing data returned by [[KeyWithIndexToValueStore]].
* Designed for object reuse.
*/
- private[state] class KeyWithIndexAndValue(
+ private[join] class KeyWithIndexAndValue(
var key: UnsafeRow = null,
var valueIndex: Long = -1,
var value: UnsafeRow = null,
@@ -737,9 +738,9 @@ abstract class SymmetricHashJoinStateManager(
if (useVirtualColumnFamilies) {
stateStore.createColFamilyIfAbsent(
colFamilyName,
- keySchema,
+ keyWithIndexSchema,
valueRowConverter.valueAttributes.toStructType,
- NoPrefixKeyStateEncoderSpec(keySchema)
+ NoPrefixKeyStateEncoderSpec(keyWithIndexSchema)
)
}
@@ -1134,17 +1135,17 @@ object SymmetricHashJoinStateManager {
val ckptIds = joinCkptInfo.left.keyToNumValues.stateStoreCkptId.map(
Array(
_,
- joinCkptInfo.left.valueToNumKeys.stateStoreCkptId.get,
+ joinCkptInfo.left.keyWithIndexToValue.stateStoreCkptId.get,
joinCkptInfo.right.keyToNumValues.stateStoreCkptId.get,
- joinCkptInfo.right.valueToNumKeys.stateStoreCkptId.get
+ joinCkptInfo.right.keyWithIndexToValue.stateStoreCkptId.get
)
)
val baseCkptIds = joinCkptInfo.left.keyToNumValues.baseStateStoreCkptId.map(
Array(
_,
- joinCkptInfo.left.valueToNumKeys.baseStateStoreCkptId.get,
+ joinCkptInfo.left.keyWithIndexToValue.baseStateStoreCkptId.get,
joinCkptInfo.right.keyToNumValues.baseStateStoreCkptId.get,
- joinCkptInfo.right.valueToNumKeys.baseStateStoreCkptId.get
+ joinCkptInfo.right.keyWithIndexToValue.baseStateStoreCkptId.get
)
)
@@ -1157,49 +1158,94 @@ object SymmetricHashJoinStateManager {
/**
* Stream-stream join has 4 state stores instead of one. So it will generate 4 different
- * checkpoint IDs. They are translated from each joiners' state store into an array through
- * mergeStateStoreCheckpointInfo(). This function is used to read it back into individual state
- * store checkpoint IDs.
- * @param partitionId
- * @param stateInfo
- * @return
+ * checkpoint IDs using stateStoreCkptIds. They are translated from each joiner's state
+ * store into an array through mergeStateStoreCheckpointInfo(). This function is used to read
+ * them back into individual state store checkpoint IDs for each store.
+ * If useColumnFamiliesForJoins is true, all four stores share the first checkpoint ID.
+ *
+ * @param partitionId the partition ID of the state store
+ * @param stateStoreCkptIds the array of checkpoint IDs for all the state stores
+ * @param useColumnFamiliesForJoins whether virtual column families are used for the join
+ *
+ * @return the checkpoint IDs for all state stores used by this stream-stream join
*/
def getStateStoreCheckpointIds(
partitionId: Int,
- stateInfo: StatefulOperatorStateInfo,
+ stateStoreCkptIds: Option[Array[Array[String]]],
useColumnFamiliesForJoins: Boolean): JoinStateStoreCheckpointId = {
if (useColumnFamiliesForJoins) {
- val ckpt = stateInfo.stateStoreCkptIds.map(_(partitionId)).map(_.head)
+ val ckpt = stateStoreCkptIds.map(_(partitionId)).map(_.head)
JoinStateStoreCheckpointId(
- left = JoinerStateStoreCheckpointId(keyToNumValues = ckpt, valueToNumKeys = ckpt),
- right = JoinerStateStoreCheckpointId(keyToNumValues = ckpt, valueToNumKeys = ckpt)
+ left = JoinerStateStoreCheckpointId(keyToNumValues = ckpt, keyWithIndexToValue = ckpt),
+ right = JoinerStateStoreCheckpointId(keyToNumValues = ckpt, keyWithIndexToValue = ckpt)
)
} else {
- val stateStoreCkptIds = stateInfo.stateStoreCkptIds
+ val stateStoreCkptIdsOpt = stateStoreCkptIds
.map(_(partitionId))
.map(_.map(Option(_)))
.getOrElse(Array.fill[Option[String]](4)(None))
JoinStateStoreCheckpointId(
left = JoinerStateStoreCheckpointId(
- keyToNumValues = stateStoreCkptIds(0),
- valueToNumKeys = stateStoreCkptIds(1)),
+ keyToNumValues = stateStoreCkptIdsOpt(0),
+ keyWithIndexToValue = stateStoreCkptIdsOpt(1)),
right = JoinerStateStoreCheckpointId(
- keyToNumValues = stateStoreCkptIds(2),
- valueToNumKeys = stateStoreCkptIds(3)))
+ keyToNumValues = stateStoreCkptIdsOpt(2),
+ keyWithIndexToValue = stateStoreCkptIdsOpt(3)))
+ }
+ }
+
+ /**
+ * Stream-stream join has 4 state stores instead of one. So it will generate 4 different
+ * checkpoint IDs when not using virtual column families.
+ * This function is used to get the checkpoint ID for a specific state store
+ * by the store name, partition ID, and the stateStoreCkptIds array. The expected names
+ * for the stores are generated by getStateStoreName().
+ * If useColumnFamiliesForJoins is true, then it will always return the first checkpoint ID.
+ *
+ * @param storeName the name of the state store
+ * @param partitionId the partition ID of the state store
+ * @param stateStoreCkptIds the array of checkpoint IDs for all the state stores
+ * @param useColumnFamiliesForJoins whether virtual column families are used for the join
+ *
+ * @return the checkpoint ID for the specific state store, or None if not found
+ */
+ def getStateStoreCheckpointId(
+ storeName: String,
+ partitionId: Int,
+ stateStoreCkptIds: Option[Array[Array[String]]],
+ useColumnFamiliesForJoins: Boolean = false) : Option[String] = {
+ if (useColumnFamiliesForJoins || storeName == StateStoreId.DEFAULT_STORE_NAME) {
+ stateStoreCkptIds.map(_(partitionId)).map(_.head)
+ } else {
+ val joinStateStoreCkptIds = getStateStoreCheckpointIds(
+ partitionId, stateStoreCkptIds, useColumnFamiliesForJoins)
+
+ if (storeName == getStateStoreName(LeftSide, KeyToNumValuesType)) {
+ joinStateStoreCkptIds.left.keyToNumValues
+ } else if (storeName == getStateStoreName(RightSide, KeyToNumValuesType)) {
+ joinStateStoreCkptIds.right.keyToNumValues
+ } else if (storeName == getStateStoreName(LeftSide, KeyWithIndexToValueType)) {
+ joinStateStoreCkptIds.left.keyWithIndexToValue
+ } else if (storeName == getStateStoreName(RightSide, KeyWithIndexToValueType)) {
+ joinStateStoreCkptIds.right.keyWithIndexToValue
+ } else {
+ None
+ }
}
}
- private[state] sealed trait StateStoreType
+ private[join] sealed trait StateStoreType
- private[state] case object KeyToNumValuesType extends StateStoreType {
+ private[join] case object KeyToNumValuesType extends StateStoreType {
override def toString(): String = "keyToNumValues"
}
- private[state] case object KeyWithIndexToValueType extends StateStoreType {
+ private[join] case object KeyWithIndexToValueType extends StateStoreType {
override def toString(): String = "keyWithIndexToValue"
}
- private[state] def getStateStoreName(joinSide: JoinSide, storeType: StateStoreType): String = {
+ private[join] def getStateStoreName(
+ joinSide: JoinSide, storeType: StateStoreType): String = {
s"$joinSide-$storeType"
}
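
A minimal, self-contained Scala sketch (not part of this patch) of the checkpoint-ID layout that the getStateStoreCheckpointIds()/getStateStoreCheckpointId() docs above describe: four IDs per partition, stored in merge order, addressed either by index or by the "$joinSide-$storeType" store name. The object name, the hard-coded store-name strings (assuming LeftSide/RightSide render as "left"/"right"), and the placeholder IDs are illustrative assumptions.

// Sketch: resolve one store's checkpoint ID from the merged per-partition array.
// Index order mirrors mergeStateStoreCheckpointInfo():
//   0 -> left keyToNumValues, 1 -> left keyWithIndexToValue,
//   2 -> right keyToNumValues, 3 -> right keyWithIndexToValue.
object JoinCheckpointIdLayoutSketch {
  private val storeNameByIndex: Seq[String] = Seq(
    "left-keyToNumValues",
    "left-keyWithIndexToValue",
    "right-keyToNumValues",
    "right-keyWithIndexToValue")

  def checkpointIdFor(
      storeName: String,
      partitionId: Int,
      stateStoreCkptIds: Option[Array[Array[String]]]): Option[String] = {
    val idx = storeNameByIndex.indexOf(storeName)
    if (idx < 0) {
      None
    } else {
      stateStoreCkptIds.map(_(partitionId)).flatMap { ids =>
        if (idx < ids.length) Some(ids(idx)) else None
      }
    }
  }

  def main(args: Array[String]): Unit = {
    // One partition, four placeholder checkpoint IDs in merge order.
    val ckptIds = Some(Array(Array("id-0", "id-1", "id-2", "id-3")))
    assert(checkpointIdFor("right-keyToNumValues", 0, ckptIds).contains("id-2"))
    assert(checkpointIdFor("unknown-store", 0, ckptIds).isEmpty)
  }
}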
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/statefulOperators.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/statefulOperators.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/statefulOperators.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/statefulOperators.scala
index d92e5dbae1aa1..cc8d354a03938 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/statefulOperators.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/statefulOperators.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful
import java.util.UUID
import java.util.concurrent.TimeUnit._
@@ -324,8 +324,11 @@ trait StateStoreWriter
.map(_._2)
.toArray
assert(
- ret.length == getStateInfo.numPartitions,
- s"ChekpointInfo length: ${ret.length}, numPartitions: ${getStateInfo.numPartitions}")
+ // Normally, we should have checkpoint info for all partitions.
+ // However, for the globalLimit operator, only partition 0 has state.
+ ret.length == getStateInfo.numPartitions
+ || (outputPartitioning.numPartitions == 1 && ret.length == 1),
+ s"CheckpointInfo length: ${ret.length}, numPartitions: ${getStateInfo.numPartitions}")
ret
}
@@ -1546,3 +1549,16 @@ trait SchemaValidationUtils extends Logging {
schemaEvolutionEnabled = usingAvro && schemaEvolutionEnabledForOperator))
}
}
+
+object StatefulOperatorsUtils {
+ val TRANSFORM_WITH_STATE_EXEC_OP_NAME = "transformWithStateExec"
+ val TRANSFORM_WITH_STATE_IN_PANDAS_EXEC_OP_NAME = "transformWithStateInPandasExec"
+ val TRANSFORM_WITH_STATE_IN_PYSPARK_EXEC_OP_NAME = "transformWithStateInPySparkExec"
+ // Seq of operator names that use state schema v3 and TWS-related options.
+ val TRANSFORM_WITH_STATE_OP_NAMES: Seq[String] = Seq(
+ TRANSFORM_WITH_STATE_EXEC_OP_NAME,
+ TRANSFORM_WITH_STATE_IN_PANDAS_EXEC_OP_NAME,
+ TRANSFORM_WITH_STATE_IN_PYSPARK_EXEC_OP_NAME
+ )
+ val SYMMETRIC_HASH_JOIN_EXEC_OP_NAME = "symmetricHashJoin"
+}
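
For context on how the constants above are consumed elsewhere in this patch (shortName in TransformWithStateExec and StreamingSymmetricHashJoinExec now reads from them), here is a tiny stand-alone sketch; the object name, helper, and main method are illustrative assumptions, not Spark code.

// Sketch: membership check against the centralised operator short names,
// mirroring the constants defined in StatefulOperatorsUtils above.
object OperatorShortNameSketch {
  val transformWithStateOpNames: Seq[String] = Seq(
    "transformWithStateExec",
    "transformWithStateInPandasExec",
    "transformWithStateInPySparkExec")
  val symmetricHashJoinOpName: String = "symmetricHashJoin"

  /** True if the operator identified by `shortName` is a transformWithState variant. */
  def usesTransformWithState(shortName: String): Boolean =
    transformWithStateOpNames.contains(shortName)

  def main(args: Array[String]): Unit = {
    assert(usesTransformWithState("transformWithStateExec"))
    assert(!usesTransformWithState(symmetricHashJoinOpName))
  }
}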
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/streamingLimits.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/streamingLimits.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/streamingLimits.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/streamingLimits.scala
index 07fe0ae4357d0..6816be103f6e2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/streamingLimits.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/streamingLimits.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful
import java.util.concurrent.TimeUnit.NANOSECONDS
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StateStoreColumnFamilySchemaUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/StateStoreColumnFamilySchemaUtils.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StateStoreColumnFamilySchemaUtils.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/StateStoreColumnFamilySchemaUtils.scala
index 4401f8cedff6b..7e25960daf33d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StateStoreColumnFamilySchemaUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/StateStoreColumnFamilySchemaUtils.scala
@@ -14,14 +14,14 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate
import scala.collection.mutable
import org.apache.spark.sql.Encoder
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
-import org.apache.spark.sql.execution.streaming.TransformWithStateVariableUtils.getRowCounterCFName
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateVariableUtils.getRowCounterCFName
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, PrefixKeyScanStateEncoderSpec, RangeKeyScanStateEncoderSpec, StateStoreColFamilySchema}
import org.apache.spark.sql.types._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StateTypesEncoderUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/StateTypesEncoderUtils.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StateTypesEncoderUtils.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/StateTypesEncoderUtils.scala
index a2b7ee4ba7916..8ce300a40b43c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StateTypesEncoderUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/StateTypesEncoderUtils.scala
@@ -15,13 +15,15 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate
import org.apache.spark.sql.Encoder
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.encoders.{encoderFor, ExpressionEncoder}
import org.apache.spark.sql.catalyst.expressions.{UnsafeProjection, UnsafeRow}
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.ImplicitGroupingKeyTracker
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.ttl.StateTTL
import org.apache.spark.sql.execution.streaming.state.StateStoreErrors
import org.apache.spark.sql.types._
@@ -180,7 +182,7 @@ class CompositeKeyStateEncoder[K, V](
stateName: String,
hasTtl: Boolean = false)
extends StateTypesEncoder[V](keyEncoder, valEncoder, stateName, hasTtl) {
- import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+ import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
/** Encoders */
private val userKeyExpressionEnc = encoderFor(userKeyEnc)
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateExec.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateExec.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateExec.scala
index 80fdaa1e71e2f..20e2c32015d84 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateExec.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate
import java.util.UUID
import java.util.concurrent.TimeUnit.NANOSECONDS
@@ -28,7 +28,10 @@ import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression, UnsafeRow}
import org.apache.spark.sql.catalyst.plans.logical._
import org.apache.spark.sql.execution._
-import org.apache.spark.sql.execution.streaming.StreamingSymmetricHashJoinHelper.StateStoreAwareZipPartitionsHelper
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperatorStateInfo, StatefulOperatorsUtils}
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.StreamingSymmetricHashJoinHelper.StateStoreAwareZipPartitionsHelper
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.{DriverStatefulProcessorHandleImpl, ImplicitGroupingKeyTracker, StatefulProcessorHandleImpl, StatefulProcessorHandleState}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.timers.{ExpiredTimerInfoImpl, TimerValuesImpl}
import org.apache.spark.sql.execution.streaming.state._
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming._
@@ -84,7 +87,7 @@ case class TransformWithStateExec(
initialState)
with ObjectProducerExec {
- override def shortName: String = "transformWithStateExec"
+ override def shortName: String = StatefulOperatorsUtils.TRANSFORM_WITH_STATE_EXEC_OP_NAME
// We need to just initialize key and value deserializer once per partition.
// The deserializers need to be lazily created on the executor since they
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateExecBase.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateExecBase.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateExecBase.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateExecBase.scala
index df68b21e0bb9f..c2d24e735ab2d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateExecBase.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateExecBase.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate
import org.apache.spark.SparkThrowable
import org.apache.spark.sql.catalyst.InternalRow
@@ -22,6 +22,8 @@ import org.apache.spark.sql.catalyst.expressions.{Ascending, Attribute, SortOrde
import org.apache.spark.sql.catalyst.plans.logical.{EventTime, ProcessingTime}
import org.apache.spark.sql.catalyst.plans.physical.Distribution
import org.apache.spark.sql.execution.{BinaryExecNode, SparkPlan}
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperatorCustomMetric, StatefulOperatorCustomSumMetric, StatefulOperatorPartitioning, StateStoreWriter, WatermarkSupport}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.ImplicitGroupingKeyTracker
import org.apache.spark.sql.execution.streaming.state.{OperatorStateMetadata, TransformWithStateUserFunctionException}
import org.apache.spark.sql.streaming.{OutputMode, TimeMode}
import org.apache.spark.sql.types.{BinaryType, StructType}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateVariableUtils.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateVariableUtils.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateVariableUtils.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateVariableUtils.scala
index 7b9a478b8be19..068303e25e2e8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TransformWithStateVariableUtils.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/TransformWithStateVariableUtils.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate
import org.json4s.DefaultFormats
import org.json4s.JsonAST._
@@ -23,7 +23,8 @@ import org.json4s.jackson.JsonMethods
import org.json4s.jackson.JsonMethods.{compact, render}
import org.apache.spark.internal.Logging
-import org.apache.spark.sql.execution.streaming.StateVariableType.StateVariableType
+import org.apache.spark.sql.execution.streaming.operators.stateful.{SchemaValidationUtils, StatefulOperatorStateInfo}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateVariableType.StateVariableType
import org.apache.spark.sql.execution.streaming.state.{OperatorInfoV1, OperatorStateMetadata, OperatorStateMetadataV2, StateStoreErrors, StateStoreId, StateStoreMetadataV2}
import org.apache.spark.sql.streaming.{OutputMode, TimeMode}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulProcessorHandleImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statefulprocessor/StatefulProcessorHandleImpl.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulProcessorHandleImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statefulprocessor/StatefulProcessorHandleImpl.scala
index 3cf3286fafb80..dfba0e1f12146 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulProcessorHandleImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statefulprocessor/StatefulProcessorHandleImpl.scala
@@ -14,7 +14,8 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+// scalastyle:off line.size.limit
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor
import java.util
import java.util.UUID
@@ -26,13 +27,19 @@ import org.apache.spark.internal.Logging
import org.apache.spark.sql.Encoder
import org.apache.spark.sql.catalyst.encoders.{encoderFor, ExpressionEncoder}
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.StatefulProcessorHandleState.PRE_INIT
-import org.apache.spark.sql.execution.streaming.StateVariableType._
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils.{getExpirationMsRowSchema, getTTLRowKeySchema}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.{StateStoreColumnFamilySchemaUtils, TimerKeyEncoder, TransformWithStateVariableInfo, TransformWithStateVariableUtils}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateVariableType._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils.{getExpirationMsRowSchema, getTTLRowKeySchema}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.StatefulProcessorHandleState.PRE_INIT
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statevariables.{ListStateImpl, MapStateImpl, ValueStateImpl}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.timers.{TimerStateImpl, TimerStateUtils}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.ttl.{ListStateImplWithTTL, MapStateImplWithTTL, TTLState, ValueStateImplWithTTL}
+import org.apache.spark.sql.execution.streaming.runtime.{MicroBatchExecution, StreamExecution}
import org.apache.spark.sql.execution.streaming.state._
import org.apache.spark.sql.streaming.{ListState, MapState, QueryInfo, TimeMode, TTLConfig, ValueState}
import org.apache.spark.sql.types._
import org.apache.spark.util.Utils
+// scalastyle:on line.size.limit
/**
* Object used to assign/retrieve/remove grouping key passed implicitly for various state
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulProcessorHandleImplBase.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statefulprocessor/StatefulProcessorHandleImplBase.scala
similarity index 85%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulProcessorHandleImplBase.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statefulprocessor/StatefulProcessorHandleImplBase.scala
index 64d87073ccf9f..4b593fe309472 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StatefulProcessorHandleImplBase.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statefulprocessor/StatefulProcessorHandleImplBase.scala
@@ -14,13 +14,15 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+// scalastyle:off line.size.limit
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.plans.logical.NoTime
-import org.apache.spark.sql.execution.streaming.StatefulProcessorHandleState.{INITIALIZED, PRE_INIT, StatefulProcessorHandleState, TIMER_PROCESSED}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.StatefulProcessorHandleState.{INITIALIZED, PRE_INIT, StatefulProcessorHandleState, TIMER_PROCESSED}
import org.apache.spark.sql.execution.streaming.state.StateStoreErrors
import org.apache.spark.sql.streaming.{StatefulProcessorHandle, TimeMode}
+// scalastyle:on line.size.limit
abstract class StatefulProcessorHandleImplBase(
timeMode: TimeMode, keyExprEnc: ExpressionEncoder[Any]) extends StatefulProcessorHandle {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ListStateImpl.scala
similarity index 93%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ListStateImpl.scala
index 32683aebd8c18..c6fe03da49ddf 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ListStateImpl.scala
@@ -14,14 +14,18 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+// scalastyle:off line.size.limit
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statevariables
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.execution.metric.SQLMetric
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateTypesEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.TWSMetricsUtils
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, StateStore, StateStoreErrors}
import org.apache.spark.sql.streaming.ListState
import org.apache.spark.sql.types.StructType
+// scalastyle:on line.size.limit
/**
* Provides concrete implementation for list of values associated with a state variable
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateMetricsImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ListStateMetricsImpl.scala
similarity index 91%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateMetricsImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ListStateMetricsImpl.scala
index 66b6bd063ae6b..2275aba1a5887 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateMetricsImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ListStateMetricsImpl.scala
@@ -14,13 +14,15 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+// scalastyle:off line.size.limit
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statevariables
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UnsafeProjection, UnsafeRow}
-import org.apache.spark.sql.execution.streaming.TransformWithStateVariableUtils.getRowCounterCFName
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateVariableUtils.getRowCounterCFName
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, StateStore}
import org.apache.spark.sql.types._
+// scalastyle:on line.size.limit
/**
* Trait that provides helper methods to maintain metrics for a list state.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MapStateImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/MapStateImpl.scala
similarity index 88%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MapStateImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/MapStateImpl.scala
index 4e608a5d5dbbe..007791ea55477 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MapStateImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/MapStateImpl.scala
@@ -14,15 +14,19 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+// scalastyle:off line.size.limit
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statevariables
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.CompositeKeyStateEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.TWSMetricsUtils
import org.apache.spark.sql.execution.streaming.state.{PrefixKeyScanStateEncoderSpec, StateStore, StateStoreErrors, UnsafeRowPair}
import org.apache.spark.sql.streaming.MapState
import org.apache.spark.sql.types.StructType
+// scalastyle:on line.size.limit
/**
* Class that provides a concrete implementation for map state associated with state
@@ -56,7 +60,10 @@ class MapStateImpl[K, V](
/** Whether state exists or not. */
override def exists(): Boolean = {
- store.prefixScan(stateTypesEncoder.encodeGroupingKey(), stateName).nonEmpty
+ val iter = store.prefixScan(stateTypesEncoder.encodeGroupingKey(), stateName)
+ val result = iter.nonEmpty
+ iter.close()
+ result
}
/** Get the state value if it exists */
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ValueStateImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ValueStateImpl.scala
similarity index 89%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ValueStateImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ValueStateImpl.scala
index d7e7a3d83f4df..2a4a79bca1e0a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ValueStateImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/statevariables/ValueStateImpl.scala
@@ -14,13 +14,17 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+// scalastyle:off line.size.limit
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statevariables
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.execution.metric.SQLMetric
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateTypesEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.TWSMetricsUtils
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, StateStore}
import org.apache.spark.sql.streaming.ValueState
+// scalastyle:on line.size.limit
/**
* Class that provides a concrete implementation for a single value state associated with state
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ExpiredTimerInfoImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/ExpiredTimerInfoImpl.scala
similarity index 93%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ExpiredTimerInfoImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/ExpiredTimerInfoImpl.scala
index 984d650a27ccc..ec602988dc3e1 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ExpiredTimerInfoImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/ExpiredTimerInfoImpl.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.timers
import org.apache.spark.sql.streaming.ExpiredTimerInfo
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TimerStateImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/TimerStateImpl.scala
similarity index 94%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TimerStateImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/TimerStateImpl.scala
index ede45fc924a98..647c0b3036a2a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TimerStateImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/TimerStateImpl.scala
@@ -14,13 +14,15 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.timers
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{EXPIRY_TIMESTAMP, KEY}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.expressions._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TimerKeyEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.ImplicitGroupingKeyTracker
import org.apache.spark.sql.execution.streaming.state._
import org.apache.spark.sql.streaming.TimeMode
import org.apache.spark.sql.types._
@@ -199,7 +201,9 @@ class TimerStateImpl(
}
}
- override protected def close(): Unit = { }
+ override protected def close(): Unit = {
+ iter.close()
+ }
}
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TimerValuesImpl.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/TimerValuesImpl.scala
similarity index 94%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TimerValuesImpl.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/TimerValuesImpl.scala
index eb65aade67e36..234b80a84e8ed 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TimerValuesImpl.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/timers/TimerValuesImpl.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.timers
import org.apache.spark.sql.streaming.TimerValues
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateImplWithTTL.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/ListStateImplWithTTL.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateImplWithTTL.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/ListStateImplWithTTL.scala
index 4e32b80578155..08f97e38bd086 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ListStateImplWithTTL.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/ListStateImplWithTTL.scala
@@ -14,12 +14,13 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.ttl
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateTypesEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, StateStore, StateStoreErrors}
import org.apache.spark.sql.streaming.{ListState, TTLConfig}
import org.apache.spark.util.NextIterator
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MapStateImplWithTTL.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/MapStateImplWithTTL.scala
similarity index 94%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MapStateImplWithTTL.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/MapStateImplWithTTL.scala
index 64581006555e7..f063354bc8c8c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MapStateImplWithTTL.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/MapStateImplWithTTL.scala
@@ -14,12 +14,14 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.ttl
import org.apache.spark.internal.Logging
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.CompositeKeyStateEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.TWSMetricsUtils
import org.apache.spark.sql.execution.streaming.state.{PrefixKeyScanStateEncoderSpec, StateStore, StateStoreErrors}
import org.apache.spark.sql.streaming.{MapState, TTLConfig}
import org.apache.spark.util.NextIterator
@@ -128,7 +130,9 @@ metrics: Map[String, SQLMetric])
}
}
- override protected def close(): Unit = {}
+ override protected def close(): Unit = {
+ unsafeRowPairIterator.close()
+ }
}
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TTLState.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/TTLState.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TTLState.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/TTLState.scala
index 398088ab16978..548a47ea75e13 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TTLState.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/TTLState.scala
@@ -14,14 +14,16 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.ttl
import java.time.Duration
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UnsafeProjection, UnsafeRow}
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TTLEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.statefulprocessor.TWSMetricsUtils
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, RangeKeyScanStateEncoderSpec, StateStore}
import org.apache.spark.sql.streaming.TTLConfig
import org.apache.spark.sql.types._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ValueStateImplWithTTL.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/ValueStateImplWithTTL.scala
similarity index 94%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ValueStateImplWithTTL.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/ValueStateImplWithTTL.scala
index 836aac4cdb5a0..587da75993610 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ValueStateImplWithTTL.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/operators/stateful/transformwithstate/ttl/ValueStateImplWithTTL.scala
@@ -14,11 +14,12 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.ttl
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.execution.metric.SQLMetric
-import org.apache.spark.sql.execution.streaming.TransformWithStateKeyValueRowSchemaUtils._
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateTypesEncoder
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateKeyValueRowSchemaUtils._
import org.apache.spark.sql.execution.streaming.state.{NoPrefixKeyStateEncoderSpec, StateStore}
import org.apache.spark.sql.streaming.{TTLConfig, ValueState}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AcceptsLatestSeenOffsetHandler.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AcceptsLatestSeenOffsetHandler.scala
similarity index 91%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AcceptsLatestSeenOffsetHandler.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AcceptsLatestSeenOffsetHandler.scala
index bf4333d8e9dd6..b15b93b47ada4 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AcceptsLatestSeenOffsetHandler.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AcceptsLatestSeenOffsetHandler.scala
@@ -15,10 +15,12 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import org.apache.spark.SparkUnsupportedOperationException
import org.apache.spark.sql.connector.read.streaming.{AcceptsLatestSeenOffset, SparkDataStream}
+import org.apache.spark.sql.execution.streaming.Source
+import org.apache.spark.sql.execution.streaming.checkpointing.OffsetSeq
/**
* This feeds "latest seen offset" to the sources that implement AcceptsLatestSeenOffset.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncLogPurge.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncLogPurge.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncLogPurge.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncLogPurge.scala
index cb7e71bda84dd..43d5a50b2ccda 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncLogPurge.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncLogPurge.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.concurrent.atomic.AtomicBoolean
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncProgressTrackingMicroBatchExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncProgressTrackingMicroBatchExecution.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncProgressTrackingMicroBatchExecution.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncProgressTrackingMicroBatchExecution.scala
index bbfedd5454deb..2a87ba3380883 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncProgressTrackingMicroBatchExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncProgressTrackingMicroBatchExecution.scala
@@ -15,16 +15,18 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.concurrent._
import java.util.concurrent.atomic.AtomicLong
import org.apache.spark.internal.LogKeys.{BATCH_ID, PRETTY_ID_STRING}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.streaming.WriteToStream
import org.apache.spark.sql.classic.SparkSession
import org.apache.spark.sql.errors.QueryExecutionErrors
+import org.apache.spark.sql.execution.streaming.{AvailableNowTrigger, OneTimeTrigger, ProcessingTimeTrigger}
+import org.apache.spark.sql.execution.streaming.checkpointing.{AsyncCommitLog, AsyncOffsetSeqLog, CommitMetadata, OffsetSeq}
+import org.apache.spark.sql.execution.streaming.operators.stateful.StateStoreWriter
import org.apache.spark.sql.streaming.Trigger
import org.apache.spark.util.{Clock, ThreadUtils}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncStreamingQueryCheckpointMetadata.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncStreamingQueryCheckpointMetadata.scala
similarity index 93%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncStreamingQueryCheckpointMetadata.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncStreamingQueryCheckpointMetadata.scala
index e3a5ded83eb17..65113ce15c397 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AsyncStreamingQueryCheckpointMetadata.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AsyncStreamingQueryCheckpointMetadata.scala
@@ -14,11 +14,12 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.concurrent.ThreadPoolExecutor
import org.apache.spark.sql.SparkSession
+import org.apache.spark.sql.execution.streaming.checkpointing.{AsyncCommitLog, AsyncOffsetSeqLog}
import org.apache.spark.util.Clock
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowDataStreamWrapper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowDataStreamWrapper.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowDataStreamWrapper.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowDataStreamWrapper.scala
index f42250c3c702d..9a5cf89d03fab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowDataStreamWrapper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowDataStreamWrapper.scala
@@ -15,12 +15,13 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{DELEGATE, READ_LIMIT}
import org.apache.spark.sql.connector.read.streaming.{MicroBatchStream, ReadLimit, SparkDataStream, SupportsAdmissionControl, SupportsTriggerAvailableNow}
import org.apache.spark.sql.connector.read.streaming
+import org.apache.spark.sql.execution.streaming.Source
/**
* This class wraps a [[SparkDataStream]] and makes it support Trigger.AvailableNow, by overriding
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowMicroBatchStreamWrapper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowMicroBatchStreamWrapper.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowMicroBatchStreamWrapper.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowMicroBatchStreamWrapper.scala
index 3df358ae9bf80..ec63033edd40b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowMicroBatchStreamWrapper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowMicroBatchStreamWrapper.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import org.apache.spark.SparkUnsupportedOperationException
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReaderFactory}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowSourceWrapper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowSourceWrapper.scala
similarity index 92%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowSourceWrapper.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowSourceWrapper.scala
index af5713144ebb2..bca4324447718 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/AvailableNowSourceWrapper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/AvailableNowSourceWrapper.scala
@@ -15,10 +15,11 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import org.apache.spark.SparkUnsupportedOperationException
import org.apache.spark.sql.DataFrame
+import org.apache.spark.sql.execution.streaming.{Offset, Source}
import org.apache.spark.sql.types.StructType
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CompactibleFileStreamLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/CompactibleFileStreamLog.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CompactibleFileStreamLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/CompactibleFileStreamLog.scala
index d6770452e71f3..8a90982b7c0c6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/CompactibleFileStreamLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/CompactibleFileStreamLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.io.{FileNotFoundException, InputStream, IOException, OutputStream}
import java.nio.charset.StandardCharsets.UTF_8
@@ -27,9 +27,10 @@ import org.apache.hadoop.fs.Path
import org.json4s.{Formats, NoTypeHints}
import org.json4s.jackson.Serialization
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.spark.internal.LogKeys
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.errors.QueryExecutionErrors
+import org.apache.spark.sql.execution.streaming.checkpointing.HDFSMetadataLog
import org.apache.spark.util.Utils
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ContinuousRecordEndpoint.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ContinuousRecordEndpoint.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ContinuousRecordEndpoint.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ContinuousRecordEndpoint.scala
index 11bdfee460e66..d948325c9ae3b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ContinuousRecordEndpoint.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ContinuousRecordEndpoint.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import scala.collection.mutable
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ErrorNotifier.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ErrorNotifier.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ErrorNotifier.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ErrorNotifier.scala
index 0f25d0667a0ef..19867c5168373 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ErrorNotifier.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ErrorNotifier.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.concurrent.atomic.AtomicReference
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamOptions.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamOptions.scala
similarity index 99%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamOptions.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamOptions.scala
index b259f9dbcdcb2..9ceee21a871c5 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamOptions.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamOptions.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.Locale
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSource.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSource.scala
similarity index 99%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSource.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSource.scala
index 465973cabe587..d5503f1c247da 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSource.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSource.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.concurrent.ThreadPoolExecutor
import java.util.concurrent.TimeUnit._
@@ -27,7 +27,7 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileStatus, FileSystem, GlobFilter, Path}
import org.apache.spark.deploy.SparkHadoopUtil
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.paths.SparkPath
import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
import org.apache.spark.sql.classic.{DataFrame, Dataset, SparkSession}
@@ -35,6 +35,8 @@ import org.apache.spark.sql.connector.read.streaming
import org.apache.spark.sql.connector.read.streaming.{ReadAllAvailable, ReadLimit, ReadMaxBytes, ReadMaxFiles, SupportsAdmissionControl, SupportsTriggerAvailableNow}
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.datasources.{DataSource, InMemoryFileIndex, LogicalRelation}
+import org.apache.spark.sql.execution.streaming.{Offset, Source}
+import org.apache.spark.sql.execution.streaming.sinks.FileStreamSink
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.ArrayImplicits._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSourceLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSourceLog.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSourceLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSourceLog.scala
index 14653864a2922..451cf41152421 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSourceLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSourceLog.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.{LinkedHashMap => JLinkedHashMap}
import java.util.Map.Entry
@@ -23,7 +23,8 @@ import java.util.Map.Entry
import scala.collection.mutable
import org.apache.spark.sql.SparkSession
-import org.apache.spark.sql.execution.streaming.FileStreamSource.FileEntry
+import org.apache.spark.sql.execution.streaming.checkpointing.HDFSMetadataLog
+import org.apache.spark.sql.execution.streaming.runtime.FileStreamSource.FileEntry
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.ArrayImplicits._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSourceOffset.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSourceOffset.scala
similarity index 94%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSourceOffset.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSourceOffset.scala
index ba79c77f38677..2cfece1942f0c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSourceOffset.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/FileStreamSourceOffset.scala
@@ -15,13 +15,15 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import scala.util.control.Exception._
import org.json4s.{Formats, NoTypeHints}
import org.json4s.jackson.Serialization
+import org.apache.spark.sql.execution.streaming.Offset
+
/**
* Offset for the [[FileStreamSource]].
*
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/IncrementalExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/IncrementalExecution.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/IncrementalExecution.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/IncrementalExecution.scala
index b6701182d7e06..0d4b0f0941d9d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/IncrementalExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/IncrementalExecution.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.UUID
import java.util.concurrent.atomic.AtomicInteger
@@ -24,7 +24,7 @@ import scala.collection.mutable.{Map => MutableMap}
import org.apache.hadoop.fs.Path
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{BATCH_TIMESTAMP, ERROR}
import org.apache.spark.sql.catalyst.QueryPlanningTracker
import org.apache.spark.sql.catalyst.expressions.{CurrentBatchTimestamp, ExpressionWithRandomSeed}
@@ -38,6 +38,11 @@ import org.apache.spark.sql.execution.aggregate.{HashAggregateExec, MergingSessi
import org.apache.spark.sql.execution.datasources.v2.state.metadata.StateMetadataPartitionReader
import org.apache.spark.sql.execution.exchange.ShuffleExchangeLike
import org.apache.spark.sql.execution.python.streaming.{FlatMapGroupsInPandasWithStateExec, TransformWithStateInPySparkExec}
+import org.apache.spark.sql.execution.streaming.checkpointing.{CheckpointFileManager, OffsetSeqMetadata}
+import org.apache.spark.sql.execution.streaming.operators.stateful.{SessionWindowStateStoreRestoreExec, SessionWindowStateStoreSaveExec, StatefulOperator, StatefulOperatorStateInfo, StateStoreRestoreExec, StateStoreSaveExec, StateStoreWriter, StreamingDeduplicateExec, StreamingDeduplicateWithinWatermarkExec, StreamingGlobalLimitExec, StreamingLocalLimitExec, UpdateEventTimeColumnExec}
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.FlatMapGroupsWithStateExec
+import org.apache.spark.sql.execution.streaming.operators.stateful.join.{StreamingSymmetricHashJoinExec, StreamingSymmetricHashJoinHelper}
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.TransformWithStateExec
import org.apache.spark.sql.execution.streaming.sources.WriteToMicroBatchDataSourceV1
import org.apache.spark.sql.execution.streaming.state.{OperatorStateMetadataReader, OperatorStateMetadataV1, OperatorStateMetadataV2, OperatorStateMetadataWriter, StateSchemaBroadcast, StateSchemaMetadata}
import org.apache.spark.sql.internal.SQLConf
@@ -73,7 +78,9 @@ class IncrementalExecution(
MutableMap[Long, StateSchemaBroadcast](),
mode: CommandExecutionMode.Value = CommandExecutionMode.ALL,
val isTerminatingTrigger: Boolean = false)
- extends QueryExecution(sparkSession, logicalPlan, mode = mode) with Logging {
+ extends QueryExecution(sparkSession, logicalPlan, mode = mode,
+ shuffleCleanupMode =
+ QueryExecution.determineShuffleCleanupMode(sparkSession.sessionState.conf)) with Logging {
// Modified planner with stateful operations.
override val planner: SparkPlanner = new SparkPlanner(
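For the IncrementalExecution constructor change above, the only new behavior is that a shuffle-cleanup mode derived from the session configuration is now passed up to QueryExecution. A purely hypothetical sketch of that kind of conf-to-mode selection, outside the patch (none of the names or keys below are Spark's; the real logic lives in QueryExecution.determineShuffleCleanupMode):

object ShuffleCleanupSketch {
  sealed trait CleanupMode
  case object DoNotCleanup extends CleanupMode
  case object RemoveShuffleFiles extends CleanupMode

  // Hypothetical: pick a mode from a flat string config; the key is illustrative only.
  def determineMode(conf: Map[String, String]): CleanupMode =
    if (conf.getOrElse("example.streaming.shuffle.cleanup.enabled", "false").toBoolean) {
      RemoveShuffleFiles
    } else {
      DoNotCleanup
    }
}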
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/LongOffset.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/LongOffset.scala
similarity index 92%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/LongOffset.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/LongOffset.scala
index a27898cb0c9fc..19588082b3c54 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/LongOffset.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/LongOffset.scala
@@ -15,7 +15,9 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
+
+import org.apache.spark.sql.execution.streaming.Offset
/**
* A simple offset for sources that produce a single linear stream of data.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataLogFileIndex.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MetadataLogFileIndex.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataLogFileIndex.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MetadataLogFileIndex.scala
index 45bb69a9c056b..32e2a0e53dd46 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetadataLogFileIndex.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MetadataLogFileIndex.scala
@@ -15,16 +15,16 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import scala.collection.mutable
import org.apache.hadoop.fs.{FileStatus, Path}
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.execution.datasources._
+import org.apache.spark.sql.execution.streaming.sinks.{FileStreamSink, FileStreamSinkLog}
import org.apache.spark.sql.types.StructType
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetricsReporter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MetricsReporter.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetricsReporter.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MetricsReporter.scala
index 3919f8a2eb21f..0789ecee8533a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MetricsReporter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MetricsReporter.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.time.ZonedDateTime
import java.time.format.DateTimeFormatter
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MicroBatchExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MicroBatchExecution.scala
similarity index 90%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MicroBatchExecution.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MicroBatchExecution.scala
index 1dd70ad985cc2..461936b40218c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/MicroBatchExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/MicroBatchExecution.scala
@@ -15,15 +15,19 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import scala.collection.mutable.{Map => MutableMap}
import scala.collection.mutable
+import scala.util.control.NonFatal
-import org.apache.spark.internal.{LogKeys, MDC}
+import org.apache.hadoop.fs.Path
+
+import org.apache.spark.internal.LogKeys
+import org.apache.spark.internal.LogKeys.BATCH_ID
import org.apache.spark.sql.catalyst.encoders.ExpressionEncoder
import org.apache.spark.sql.catalyst.expressions.{Alias, Attribute, CurrentBatchTimestamp, CurrentDate, CurrentTimestamp, FileSourceMetadataAttribute, LocalTimestamp}
-import org.apache.spark.sql.catalyst.plans.logical.{LeafNode, LocalRelation, LogicalPlan, Project, StreamSourceAwareLogicalPlan}
+import org.apache.spark.sql.catalyst.plans.logical.{Aggregate, GlobalLimit, LeafNode, LocalRelation, LogicalPlan, Project, StreamSourceAwareLogicalPlan}
import org.apache.spark.sql.catalyst.streaming.{StreamingRelationV2, WriteToStream}
import org.apache.spark.sql.catalyst.trees.TreePattern.CURRENT_LIKE
import org.apache.spark.sql.catalyst.util.truncatedString
@@ -35,8 +39,13 @@ import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.{SparkPlan, SQLExecution}
import org.apache.spark.sql.execution.datasources.LogicalRelation
import org.apache.spark.sql.execution.datasources.v2.{DataSourceV2Relation, StreamingDataSourceV2Relation, StreamingDataSourceV2ScanRelation, StreamWriterCommitProgress, WriteToDataSourceV2Exec}
-import org.apache.spark.sql.execution.streaming.sources.{WriteToMicroBatchDataSource, WriteToMicroBatchDataSourceV1}
-import org.apache.spark.sql.execution.streaming.state.StateSchemaBroadcast
+import org.apache.spark.sql.execution.streaming.{AvailableNowTrigger, Offset, OneTimeTrigger, ProcessingTimeTrigger, Sink, Source}
+import org.apache.spark.sql.execution.streaming.checkpointing.{CheckpointFileManager, CommitMetadata, OffsetSeq, OffsetSeqMetadata}
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperatorStateInfo, StatefulOpStateStoreCheckpointInfo, StateStoreWriter}
+import org.apache.spark.sql.execution.streaming.runtime.AcceptsLatestSeenOffsetHandler
+import org.apache.spark.sql.execution.streaming.runtime.StreamingCheckpointConstants.{DIR_NAME_COMMITS, DIR_NAME_OFFSETS, DIR_NAME_STATE}
+import org.apache.spark.sql.execution.streaming.sources.{ForeachBatchSink, WriteToMicroBatchDataSource, WriteToMicroBatchDataSourceV1}
+import org.apache.spark.sql.execution.streaming.state.{StateSchemaBroadcast, StateStoreErrors}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.streaming.Trigger
import org.apache.spark.util.{Clock, Utils}
@@ -303,6 +312,15 @@ class MicroBatchExecution(
}
private val watermarkPropagator = WatermarkPropagator(sparkSession.sessionState.conf)
+ private lazy val hasGlobalAggregateOrLimit = containsGlobalAggregateOrLimit(logicalPlan)
+
+ private def containsGlobalAggregateOrLimit(logicalPlan: LogicalPlan): Boolean = {
+ logicalPlan.collect {
+ case agg: Aggregate if agg.groupingExpressions.isEmpty => agg
+ case limit: GlobalLimit => limit
+ }.nonEmpty
+ }
+
override def cleanup(): Unit = {
super.cleanup()
@@ -547,12 +565,40 @@ class MicroBatchExecution(
log"offsets ${MDC(LogKeys.STREAMING_OFFSETS_START, execCtx.startOffsets)} and " +
log"available offsets ${MDC(LogKeys.STREAMING_OFFSETS_END, execCtx.endOffsets)}")
case None => // We are starting this stream for the first time.
+ val shouldVerifyNewCheckpointDirectory =
+ sparkSession.conf.get(SQLConf.STREAMING_VERIFY_CHECKPOINT_DIRECTORY_EMPTY_ON_START)
+ if (shouldVerifyNewCheckpointDirectory) {
+ verifyNewCheckpointDirectory()
+ }
logInfo(s"Starting new streaming query.")
execCtx.batchId = 0
watermarkTracker = WatermarkTracker(sparkSessionToRunBatches.conf, logicalPlan)
}
}
+ /**
+ * Verify that the checkpoint directory is in a good state to start a new
+ * streaming query. This checks that the offsets, state, and commits directories are
+ * either non-existent or empty.
+ *
+ * If this check fails, an exception is thrown.
+ */
+ private def verifyNewCheckpointDirectory(): Unit = {
+ val fileManager = CheckpointFileManager.create(new Path(resolvedCheckpointRoot),
+ sparkSession.sessionState.newHadoopConf())
+ val dirNamesThatShouldNotHaveFiles = Array[String](
+ DIR_NAME_OFFSETS, DIR_NAME_STATE, DIR_NAME_COMMITS)
+
+ dirNamesThatShouldNotHaveFiles.foreach { dirName =>
+ val path = new Path(resolvedCheckpointRoot, dirName)
+
+ if (fileManager.exists(path) && !fileManager.list(path).isEmpty) {
+ val loc = path.toString
+ throw StateStoreErrors.streamingStateCheckpointLocationNotEmpty(loc)
+ }
+ }
+ }
+
/**
* Returns true if there is any new data available to be processed.
*/
@@ -862,6 +908,8 @@ class MicroBatchExecution(
isTerminatingTrigger = trigger.isInstanceOf[AvailableNowTrigger.type])
execCtx.executionPlan.executedPlan // Force the lazy generation of execution plan
}
+ // Set up StateStore commit tracking before execution begins
+ setupStateStoreCommitTracking(execCtx)
markMicroBatchExecutionStart(execCtx)
@@ -965,6 +1013,50 @@ class MicroBatchExecution(
}
}
+
+ /**
+ * Set up tracking for StateStore commits before batch execution begins.
+ * This collects information about expected stateful operators and initializes
+ * commit tracking, but only for ForeachBatchSink without global aggregates or limits.
+ */
+ private def setupStateStoreCommitTracking(execCtx: MicroBatchExecutionContext): Unit = {
+ try {
+ // Collect stateful operators from the executed plan
+ val statefulOps = execCtx.executionPlan.executedPlan.collect {
+ case s: StateStoreWriter => s
+ }
+
+ if (statefulOps.nonEmpty &&
+ sparkSession.sessionState.conf.stateStoreCommitValidationEnabled) {
+
+ // Start tracking before execution begins
+ // We only validate commits for ForeachBatchSink because it's the only sink where
+ // user-defined functions can cause partial processing (e.g., using show() or limit()).
+ // We exclude queries with global aggregates or limits because they naturally don't
+ // process all partitions, making commit validation unnecessary and potentially noisy.
+ if (sink.isInstanceOf[ForeachBatchSink[_]] && !hasGlobalAggregateOrLimit) {
+ progressReporter.shouldValidateStateStoreCommit.set(true)
+ // Build expected stores map: operatorId -> (storeName -> numPartitions)
+ val expectedStores = statefulOps.map { op =>
+ val operatorId = op.getStateInfo.operatorId
+ val numPartitions = op.getStateInfo.numPartitions
+ val storeNames = op.stateStoreNames.map(_ -> numPartitions).toMap
+ operatorId -> storeNames
+ }.toMap
+ sparkSession.streams.stateStoreCoordinator
+ .startStateStoreCommitTrackingForBatch(runId, execCtx.batchId, expectedStores)
+ }
+ // TODO: Find out how to dynamically set the SQLConf at this point to disable
+ // the commit tracking
+ }
+ } catch {
+ case NonFatal(e) =>
+ // Log but don't fail the query for tracking setup errors
+ logWarning(log"Error during StateStore commit tracking setup for batch " +
+ log"${MDC(BATCH_ID, execCtx.batchId)}", e)
+ }
+ }
+
/**
* Called after the microbatch has completed execution. It takes care of committing the offset
* to commit log and other bookkeeping.
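The commit-validation changes to MicroBatchExecution above track expected StateStore commits as a map of shape operatorId -> (storeName -> numPartitions) and later compare it against the commits actually reported for the batch. A minimal, self-contained sketch of that bookkeeping follows (plain Scala, outside the patch; CommitTrackingSketch, CommitKey and validate are hypothetical names, and Spark's actual StateStoreCoordinator RPCs such as startStateStoreCommitTrackingForBatch are not reproduced here):

object CommitTrackingSketch {
  // operatorId -> (storeName -> numPartitions), mirroring the map built in
  // setupStateStoreCommitTracking above.
  type ExpectedStores = Map[Long, Map[String, Int]]

  // One commit record per (operator, store, partition), as a coordinator might receive them.
  final case class CommitKey(operatorId: Long, storeName: String, partitionId: Int)

  // Describe every expected commit that never arrived for the batch.
  def validate(expected: ExpectedStores, committed: Set[CommitKey]): Seq[String] = {
    for {
      (operatorId, stores) <- expected.toSeq
      (storeName, numPartitions) <- stores.toSeq
      partitionId <- 0 until numPartitions
      if !committed.contains(CommitKey(operatorId, storeName, partitionId))
    } yield s"missing commit: operator=$operatorId, store=$storeName, partition=$partitionId"
  }

  def main(args: Array[String]): Unit = {
    val expected: ExpectedStores = Map(0L -> Map("default" -> 2))
    val committed = Set(CommitKey(0L, "default", 0)) // partition 1 never committed its store
    validate(expected, committed).foreach(println)
  }
}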
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ProgressReporter.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ProgressReporter.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ProgressReporter.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ProgressReporter.scala
index dc04ba3331e71..19aa068869dc2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ProgressReporter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ProgressReporter.scala
@@ -15,17 +15,18 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.time.Instant
import java.time.ZoneId
import java.time.format.DateTimeFormatter
import java.util.{Optional, UUID}
+import java.util.concurrent.atomic.AtomicBoolean
import scala.collection.mutable
import scala.jdk.CollectionConverters._
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.Row
import org.apache.spark.sql.catalyst.optimizer.InlineCTE
import org.apache.spark.sql.catalyst.plans.logical.{EventTimeWatermark, LogicalPlan, WithCTE}
@@ -36,6 +37,8 @@ import org.apache.spark.sql.connector.catalog.Table
import org.apache.spark.sql.connector.read.streaming.{MicroBatchStream, ReportsSinkMetrics, ReportsSourceMetrics, SparkDataStream}
import org.apache.spark.sql.execution.{QueryExecution, StreamSourceAwareSparkPlan}
import org.apache.spark.sql.execution.datasources.v2.{MicroBatchScanExec, StreamingDataSourceV2ScanRelation, StreamWriterCommitProgress}
+import org.apache.spark.sql.execution.streaming.checkpointing.OffsetSeqMetadata
+import org.apache.spark.sql.execution.streaming.operators.stateful.{EventTimeWatermarkExec, StateStoreWriter}
import org.apache.spark.sql.execution.streaming.state.StateStoreCoordinatorRef
import org.apache.spark.sql.streaming._
import org.apache.spark.sql.streaming.StreamingQueryListener.{QueryIdleEvent, QueryProgressEvent}
@@ -56,6 +59,8 @@ class ProgressReporter(
// The timestamp we report an event that has not executed anything
var lastNoExecutionProgressEventTime = Long.MinValue
+ val shouldValidateStateStoreCommit = new AtomicBoolean(false)
+
/** Holds the most recent query progress updates. Accesses must lock on the queue itself. */
private val progressBuffer = new mutable.Queue[StreamingQueryProgress]()
@@ -277,6 +282,15 @@ abstract class ProgressContext(
currentTriggerStartOffsets != null && currentTriggerEndOffsets != null &&
currentTriggerLatestOffsets != null
)
+
+ // Only validate commits if enabled and the query has stateful operators
+ if (progressReporter.shouldValidateStateStoreCommit.get()) {
+ progressReporter.stateStoreCoordinator.validateStateStoreCommitForBatch(
+ lastExecution.runId,
+ lastExecution.currentBatchId
+ )
+ }
+
currentTriggerEndTimestamp = triggerClock.getTimeMillis()
val processingTimeMills = currentTriggerEndTimestamp - currentTriggerStartTimestamp
assert(lastExecution != null, "executed batch should provide the information for execution.")
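The ProgressReporter side of the same feature is just an opt-in gate: shouldValidateStateStoreCommit is an AtomicBoolean flipped during batch setup and consulted once per completed trigger. A small sketch of that gating pattern, with hypothetical names apart from AtomicBoolean itself and the validation callback injected rather than wired to a real coordinator:

import java.util.concurrent.atomic.AtomicBoolean

// Sketch only: the flag is set once when commit tracking is enabled for the query,
// and each finished trigger checks it before invoking the injected validation callback.
class ValidationGateSketch(validate: (String, Long) => Unit) {
  private val shouldValidate = new AtomicBoolean(false)

  def enableValidation(): Unit = shouldValidate.set(true)

  def onTriggerFinished(runId: String, batchId: Long): Unit = {
    if (shouldValidate.get()) {
      validate(runId, batchId)
    }
  }
}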
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/RateStreamOffset.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/RateStreamOffset.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/RateStreamOffset.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/RateStreamOffset.scala
index 84f0961e4af12..2ec50b604ac8f 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/RateStreamOffset.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/RateStreamOffset.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import org.json4s.DefaultFormats
import org.json4s.jackson.Serialization
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ResolveWriteToStream.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ResolveWriteToStream.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ResolveWriteToStream.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ResolveWriteToStream.scala
index 6c0a228ec2fca..ee7bf67eb9121 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/ResolveWriteToStream.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/ResolveWriteToStream.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.UUID
@@ -24,13 +24,13 @@ import scala.util.control.NonFatal
import org.apache.hadoop.fs.Path
import org.apache.spark.internal.LogKeys.{CHECKPOINT_LOCATION, CHECKPOINT_ROOT, CONFIG, PATH}
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.analysis.UnsupportedOperationChecker
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.catalyst.streaming.{WriteToStream, WriteToStreamStatement}
import org.apache.spark.sql.connector.catalog.SupportsWrite
import org.apache.spark.sql.errors.{QueryCompilationErrors, QueryExecutionErrors}
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.Utils
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/SerializedOffset.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/SerializedOffset.scala
similarity index 91%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/SerializedOffset.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/SerializedOffset.scala
index 129cfed860eb6..e84ac4c1a1ed8 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/SerializedOffset.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/SerializedOffset.scala
@@ -15,7 +15,9 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
+
+import org.apache.spark.sql.execution.streaming.Offset
/**
* Used when loading a JSON serialized offset from external storage.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamExecution.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecution.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamExecution.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecution.scala
index 8dd055949289a..17095bcabf32a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamExecution.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecution.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.io.{InterruptedIOException, UncheckedIOException}
import java.nio.channels.ClosedByInterruptException
@@ -33,7 +33,7 @@ import org.apache.hadoop.fs.Path
import org.apache.logging.log4j.CloseableThreadContext
import org.apache.spark.{JobArtifactSet, SparkContext, SparkException, SparkThrowable}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CHECKPOINT_PATH, CHECKPOINT_ROOT, LOGICAL_PLAN, PATH, PRETTY_ID_STRING, QUERY_ID, RUN_ID, SPARK_DATA_STREAM}
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.catalyst.streaming.InternalOutputModes._
@@ -43,6 +43,8 @@ import org.apache.spark.sql.connector.read.streaming.{Offset => OffsetV2, ReadLi
import org.apache.spark.sql.connector.write.{LogicalWriteInfoImpl, SupportsTruncate, Write}
import org.apache.spark.sql.execution.SparkPlan
import org.apache.spark.sql.execution.command.StreamingExplainCommand
+import org.apache.spark.sql.execution.streaming.checkpointing.{CheckpointFileManager, CommitLog, OffsetSeqLog, OffsetSeqMetadata}
+import org.apache.spark.sql.execution.streaming.operators.stateful.{StatefulOperator, StateStoreWriter}
import org.apache.spark.sql.execution.streaming.sources.{ForeachBatchUserFuncException, ForeachUserFuncException}
import org.apache.spark.sql.execution.streaming.state.OperatorStateMetadataV2FileManager
import org.apache.spark.sql.internal.SQLConf
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamExecutionContext.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecutionContext.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamExecutionContext.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecutionContext.scala
index c5e14df3e20e1..b177bbdede740 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamExecutionContext.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamExecutionContext.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.UUID
@@ -24,6 +24,7 @@ import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
import org.apache.spark.sql.connector.catalog.Table
import org.apache.spark.sql.connector.read.streaming.SparkDataStream
+import org.apache.spark.sql.execution.streaming.checkpointing.OffsetSeqMetadata
import org.apache.spark.util.Clock
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamMetadata.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamMetadata.scala
similarity index 90%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamMetadata.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamMetadata.scala
index 84519150ca42b..04e2dfb7833e6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamMetadata.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamMetadata.scala
@@ -15,22 +15,23 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.io.{InputStreamReader, OutputStreamWriter}
import java.nio.charset.StandardCharsets
import scala.util.control.NonFatal
-import org.apache.commons.io.IOUtils
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileAlreadyExistsException, FSDataInputStream, Path}
import org.json4s.{Formats, NoTypeHints}
import org.json4s.jackson.Serialization
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager.CancellableFSDataOutputStream
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager.CancellableFSDataOutputStream
+import org.apache.spark.util.Utils
/**
* Contains metadata associated with a [[org.apache.spark.sql.streaming.StreamingQuery]].
@@ -63,7 +64,7 @@ object StreamMetadata extends Logging {
logError(log"Error reading stream metadata from ${MDC(LogKeys.PATH, metadataFile)}", e)
throw e
} finally {
- IOUtils.closeQuietly(input)
+ Utils.closeQuietly(input)
}
} else None
}
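The StreamMetadata hunk above swaps commons-io's IOUtils.closeQuietly for Spark's own Utils.closeQuietly. The idiom being relied on is simply "close and swallow any failure"; a JDK-only sketch of it (our illustration, not Spark's Utils implementation):

import java.io.Closeable
import scala.util.control.NonFatal

object CloseQuietlySketch {
  // Close a resource and ignore any non-fatal failure from close(); null is tolerated.
  def closeQuietly(resource: Closeable): Unit = {
    if (resource != null) {
      try resource.close()
      catch { case NonFatal(_) => () } // intentionally swallowed
    }
  }
}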
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamProgress.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamProgress.scala
similarity index 92%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamProgress.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamProgress.scala
index 02f52bb30e1f3..a6fd103e8d6a3 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamProgress.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamProgress.scala
@@ -15,11 +15,12 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import scala.collection.immutable
import org.apache.spark.sql.connector.read.streaming.{Offset => OffsetV2, SparkDataStream}
+import org.apache.spark.sql.execution.streaming.checkpointing.{OffsetSeq, OffsetSeqMetadata}
/**
* A helper class that looks like a Map[Source, Offset].
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingCheckpointConstants.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingCheckpointConstants.scala
similarity index 94%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingCheckpointConstants.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingCheckpointConstants.scala
index 27c76ba6bd67b..b92d862e17889 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingCheckpointConstants.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingCheckpointConstants.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
object StreamingCheckpointConstants {
val DIR_NAME_COMMITS = "commits"
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryCheckpointMetadata.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryCheckpointMetadata.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryCheckpointMetadata.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryCheckpointMetadata.scala
index 072ccb21e514a..cc7e92d9d7d1c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryCheckpointMetadata.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryCheckpointMetadata.scala
@@ -14,13 +14,14 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.UUID
import org.apache.hadoop.fs.Path
import org.apache.spark.sql.SparkSession
+import org.apache.spark.sql.execution.streaming.checkpointing.{CommitLog, OffsetSeqLog}
/**
* An interface for accessing the checkpoint metadata associated with a streaming query.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryListenerBus.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryListenerBus.scala
similarity index 99%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryListenerBus.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryListenerBus.scala
index b3014ebc818da..d3762eada387e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryListenerBus.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryListenerBus.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.UUID
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryWrapper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryWrapper.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryWrapper.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryWrapper.scala
index c59b9584f5383..5585962ae16a0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingQueryWrapper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingQueryWrapper.scala
@@ -14,7 +14,7 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.UUID
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingRelation.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingRelation.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingRelation.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingRelation.scala
index c5d5a79d34545..96f6340cb958d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/StreamingRelation.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/StreamingRelation.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.SparkSession
@@ -29,6 +29,7 @@ import org.apache.spark.sql.connector.read.streaming.SparkDataStream
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.LeafExecNode
import org.apache.spark.sql.execution.datasources.{DataSource, FileFormat}
+import org.apache.spark.sql.execution.streaming.Source
import org.apache.spark.sql.sources.SupportsStreamSourceMetadataColumns
object StreamingRelation {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TriggerExecutor.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/TriggerExecutor.scala
similarity index 95%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TriggerExecutor.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/TriggerExecutor.scala
index bfa838e43e288..8a175e633d49d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/TriggerExecutor.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/TriggerExecutor.scala
@@ -15,10 +15,11 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{ELAPSED_TIME, TRIGGER_INTERVAL}
+import org.apache.spark.sql.execution.streaming.ProcessingTimeTrigger
import org.apache.spark.util.{Clock, SystemClock}
trait TriggerExecutor {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/WatermarkPropagator.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/WatermarkPropagator.scala
similarity index 98%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/WatermarkPropagator.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/WatermarkPropagator.scala
index aaf8cbd69ea20..b3d5baf0b5af0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/WatermarkPropagator.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/WatermarkPropagator.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.{util => jutil}
@@ -24,6 +24,7 @@ import scala.collection.mutable
import org.apache.spark.internal.Logging
import org.apache.spark.sql.AnalysisException
import org.apache.spark.sql.execution.SparkPlan
+import org.apache.spark.sql.execution.streaming.operators.stateful.{EventTimeWatermarkExec, StateStoreWriter}
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.Utils
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/WatermarkTracker.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/WatermarkTracker.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/WatermarkTracker.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/WatermarkTracker.scala
index 7228767c4d18a..6d94630d8c3bd 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/WatermarkTracker.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/WatermarkTracker.scala
@@ -15,17 +15,18 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util.{Locale, UUID}
import scala.collection.mutable
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.RuntimeConfig
import org.apache.spark.sql.catalyst.plans.logical.{EventTimeWatermark, LogicalPlan}
import org.apache.spark.sql.execution.SparkPlan
+import org.apache.spark.sql.execution.streaming.operators.stateful.EventTimeWatermarkExec
import org.apache.spark.sql.internal.SQLConf
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/memory.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/memory.scala
similarity index 99%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/memory.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/memory.scala
index 48af1972e581c..68eb3cc7688d2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/memory.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/runtime/memory.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.runtime
import java.util
import java.util.concurrent.atomic.AtomicInteger
@@ -37,6 +37,7 @@ import org.apache.spark.sql.classic.ClassicConversions.castToImpl
import org.apache.spark.sql.connector.catalog.{SupportsRead, Table, TableCapability}
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory, Scan, ScanBuilder}
import org.apache.spark.sql.connector.read.streaming.{ContinuousStream, MicroBatchStream, Offset => OffsetV2, ReadLimit, SparkDataStream, SupportsTriggerAvailableNow}
+import org.apache.spark.sql.execution.streaming.Offset
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.sql.internal.connector.SimpleTableProvider
import org.apache.spark.sql.types.StructType
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSink.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sinks/FileStreamSink.scala
similarity index 96%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSink.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sinks/FileStreamSink.scala
index 11e764821c71a..978ec99ae9b39 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSink.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sinks/FileStreamSink.scala
@@ -15,7 +15,7 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.sinks
import scala.util.control.NonFatal
@@ -23,7 +23,7 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileSystem, Path}
import org.apache.spark.SparkException
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{BATCH_ID, ERROR, PATH}
import org.apache.spark.internal.io.FileCommitProtocol
import org.apache.spark.sql.{DataFrame, SparkSession}
@@ -31,6 +31,8 @@ import org.apache.spark.sql.catalyst.expressions._
import org.apache.spark.sql.classic.ClassicConversions.castToImpl
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.datasources.{BasicWriteJobStatsTracker, FileFormat, FileFormatWriter}
+import org.apache.spark.sql.execution.streaming.{ManifestFileCommitProtocol, Sink}
+import org.apache.spark.sql.execution.streaming.runtime.StreamExecution
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.{SerializableConfiguration, Utils}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSinkLog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sinks/FileStreamSinkLog.scala
similarity index 97%
rename from sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSinkLog.scala
rename to sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sinks/FileStreamSinkLog.scala
index 556438811c44d..71679e284f9d9 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/FileStreamSinkLog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sinks/FileStreamSinkLog.scala
@@ -15,14 +15,14 @@
* limitations under the License.
*/
-package org.apache.spark.sql.execution.streaming
+package org.apache.spark.sql.execution.streaming.sinks
import org.apache.hadoop.fs.FileStatus
import org.apache.spark.internal.LogKeys._
-import org.apache.spark.internal.MDC
import org.apache.spark.paths.SparkPath
import org.apache.spark.sql.SparkSession
+import org.apache.spark.sql.execution.streaming.runtime.CompactibleFileStreamLog
import org.apache.spark.sql.internal.SQLConf
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/ContinuousMemoryStream.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/ContinuousMemoryStream.scala
index d0ba95ffd8a23..03884d02faeb7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/ContinuousMemoryStream.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/ContinuousMemoryStream.scala
@@ -32,7 +32,8 @@ import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.connector.read.InputPartition
import org.apache.spark.sql.connector.read.streaming.{ContinuousPartitionReader, ContinuousPartitionReaderFactory, ContinuousStream, Offset, PartitionOffset}
-import org.apache.spark.sql.execution.streaming.{Offset => _, _}
+import org.apache.spark.sql.execution.streaming.{Offset => _}
+import org.apache.spark.sql.execution.streaming.runtime.{ContinuousRecordEndpoint, ContinuousRecordPartitionOffset, GetRecord, MemoryStreamBase}
import org.apache.spark.util.RpcUtils
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/RateStreamMicroBatchStream.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/RateStreamMicroBatchStream.scala
index 6705201c67316..80d3d97b12ed7 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/RateStreamMicroBatchStream.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/RateStreamMicroBatchStream.scala
@@ -21,9 +21,7 @@ import java.io._
import java.nio.charset.StandardCharsets
import java.util.concurrent.TimeUnit
-import org.apache.commons.io.IOUtils
-
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.catalyst.InternalRow
@@ -31,9 +29,10 @@ import org.apache.spark.sql.catalyst.util.DateTimeUtils
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
import org.apache.spark.sql.connector.read.streaming.{MicroBatchStream, Offset}
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming._
+import org.apache.spark.sql.execution.streaming.checkpointing.HDFSMetadataLog
+import org.apache.spark.sql.execution.streaming.runtime._
import org.apache.spark.sql.util.CaseInsensitiveStringMap
-import org.apache.spark.util.{ManualClock, SystemClock}
+import org.apache.spark.util.{ManualClock, SystemClock, Utils}
class RateStreamMicroBatchStream(
rowsPerSecond: Long,
@@ -71,7 +70,7 @@ class RateStreamMicroBatchStream(
}
override def deserialize(in: InputStream): LongOffset = {
- val content = IOUtils.toString(new InputStreamReader(in, StandardCharsets.UTF_8))
+ val content = Utils.toString(in)
// HDFSMetadataLog guarantees that it never creates a partial file.
assert(content.length != 0)
if (content(0) == 'v') {
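RateStreamMicroBatchStream.deserialize now reads the whole offset file through Utils.toString(in) instead of IOUtils.toString over an InputStreamReader. Assuming the replacement keeps the same read-everything-as-UTF-8 behavior, a JDK-only equivalent looks like this (the helper name is ours, not Spark's Utils API; readAllBytes needs Java 9+):

import java.io.InputStream
import java.nio.charset.StandardCharsets

object StreamToStringSketch {
  // Drain the stream and decode it as UTF-8, mirroring what deserialize() expects.
  def toUtf8String(in: InputStream): String =
    new String(in.readAllBytes(), StandardCharsets.UTF_8)
}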
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/TextSocketMicroBatchStream.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/TextSocketMicroBatchStream.scala
index 597b981ebe556..243d6c784f5ae 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/TextSocketMicroBatchStream.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/sources/TextSocketMicroBatchStream.scala
@@ -25,13 +25,13 @@ import javax.annotation.concurrent.GuardedBy
import scala.collection.mutable.ListBuffer
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{HOST, PORT}
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.util.DateTimeUtils
import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
import org.apache.spark.sql.connector.read.streaming.{MicroBatchStream, Offset}
-import org.apache.spark.sql.execution.streaming.LongOffset
+import org.apache.spark.sql.execution.streaming.runtime.LongOffset
import org.apache.spark.unsafe.types.UTF8String
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/HDFSBackedStateStoreProvider.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/HDFSBackedStateStoreProvider.scala
index 25a1ca249c223..ac7f1a021960d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/HDFSBackedStateStoreProvider.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/HDFSBackedStateStoreProvider.scala
@@ -26,18 +26,16 @@ import scala.collection.mutable
import scala.jdk.CollectionConverters._
import scala.util.control.NonFatal
-import com.google.common.io.ByteStreams
-import org.apache.commons.io.IOUtils
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs._
-import org.apache.spark.{SparkConf, SparkEnv, SparkException}
-import org.apache.spark.internal.{Logging, LogKeys, MDC, MessageWithContext}
+import org.apache.spark.{SparkConf, SparkEnv, SparkException, TaskContext}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.io.CompressionCodec
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager.CancellableFSDataOutputStream
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager.CancellableFSDataOutputStream
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.{SizeEstimator, Utils}
import org.apache.spark.util.ArrayImplicits._
@@ -83,19 +81,24 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
override def get(key: UnsafeRow, colFamilyName: String): UnsafeRow = map.get(key)
- override def iterator(colFamilyName: String): Iterator[UnsafeRowPair] = {
- map.iterator()
+ override def iterator(colFamilyName: String): StateStoreIterator[UnsafeRowPair] = {
+ val iter = map.iterator()
+ new StateStoreIterator(iter)
}
override def abort(): Unit = {}
+ override def release(): Unit = {}
+
override def toString(): String = {
- s"HDFSReadStateStore[id=(op=${id.operatorId},part=${id.partitionId}),dir=$baseDir]"
+ s"HDFSReadStateStore[stateStoreId=$stateStoreId_, version=$version]"
}
- override def prefixScan(prefixKey: UnsafeRow, colFamilyName: String):
- Iterator[UnsafeRowPair] = {
- map.prefixScan(prefixKey)
+ override def prefixScan(
+ prefixKey: UnsafeRow,
+ colFamilyName: String): StateStoreIterator[UnsafeRowPair] = {
+ val iter = map.prefixScan(prefixKey)
+ new StateStoreIterator(iter)
}
override def valuesIterator(key: UnsafeRow, colFamilyName: String): Iterator[UnsafeRow] = {
@@ -112,6 +115,15 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
case object UPDATING extends STATE
case object COMMITTED extends STATE
case object ABORTED extends STATE
+ case object RELEASED extends STATE
+
+ Option(TaskContext.get()).foreach { ctxt =>
+ ctxt.addTaskCompletionListener[Unit](ctx => {
+ if (state == UPDATING) {
+ abort()
+ }
+ })
+ }
private val newVersion = version + 1
@volatile private var state: STATE = UPDATING
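The listener added above aborts a store that is still UPDATING when its owning task finishes. A simplified, self-contained sketch of that pattern, with a fake task context standing in for Spark's `TaskContext.addTaskCompletionListener` (all names here are illustrative):

```scala
object AbortOnCompletionSketch {
  sealed trait State
  case object Updating extends State
  case object Committed extends State
  case object Aborted extends State

  final class Store {
    @volatile private var state: State = Updating
    def commit(): Unit = state = Committed
    def abort(): Unit = if (state == Updating) state = Aborted
    def currentState: State = state
  }

  // Stand-in for a task context: callbacks run when the task completes.
  final class FakeTaskContext {
    private var listeners = List.empty[() => Unit]
    def addCompletionListener(f: () => Unit): Unit = listeners ::= f
    def complete(): Unit = listeners.foreach(_.apply())
  }

  def main(args: Array[String]): Unit = {
    val ctx = new FakeTaskContext
    val store = new Store
    ctx.addCompletionListener(() => store.abort()) // registered when the store is created
    ctx.complete()                                 // task ends without committing
    assert(store.currentState == Aborted)
  }
}
```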
@@ -173,6 +185,12 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
logInfo(log"Committed version ${MDC(LogKeys.COMMITTED_VERSION, newVersion)} " +
log"for ${MDC(LogKeys.STATE_STORE_PROVIDER, this)} to file " +
log"${MDC(LogKeys.FILE_NAME, finalDeltaFile)}")
+
+ // Report the commit to StateStoreCoordinator for tracking
+ if (storeConf.commitValidationEnabled) {
+ StateStore.reportCommitToCoordinator(newVersion, stateStoreId, hadoopConf)
+ }
+
newVersion
} catch {
case e: Throwable =>
@@ -198,15 +216,18 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
* Get an iterator of all the store data.
* This can be called only after committing all the updates made in the current thread.
*/
- override def iterator(colFamilyName: String): Iterator[UnsafeRowPair] = {
+ override def iterator(colFamilyName: String): StateStoreIterator[UnsafeRowPair] = {
assertUseOfDefaultColFamily(colFamilyName)
- mapToUpdate.iterator()
+ val iter = mapToUpdate.iterator()
+ new StateStoreIterator(iter)
}
- override def prefixScan(prefixKey: UnsafeRow, colFamilyName: String):
- Iterator[UnsafeRowPair] = {
+ override def prefixScan(
+ prefixKey: UnsafeRow,
+ colFamilyName: String): StateStoreIterator[UnsafeRowPair] = {
assertUseOfDefaultColFamily(colFamilyName)
- mapToUpdate.prefixScan(prefixKey)
+ val iter = mapToUpdate.prefixScan(prefixKey)
+ new StateStoreIterator(iter)
}
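The iterator and prefixScan methods now return a `StateStoreIterator` wrapper instead of a bare `Iterator`. As a rough sketch under stated assumptions (the real `StateStoreIterator` contract is not shown in this hunk), a thin wrapper that forwards to the underlying iterator and exposes an explicit release hook looks like this:

```scala
// Illustrative only: forwards to an underlying iterator and runs a hook on close().
final class WrappedIterator[T](underlying: Iterator[T], onClose: () => Unit = () => ())
    extends Iterator[T] {
  private var closed = false
  override def hasNext: Boolean = !closed && underlying.hasNext
  override def next(): T = underlying.next()
  def close(): Unit = if (!closed) { closed = true; onClose() }
}

object WrappedIteratorExample {
  def main(args: Array[String]): Unit = {
    val it = new WrappedIterator(Iterator(1, 2, 3), () => println("released"))
    println(it.sum)  // 6
    it.close()       // runs the release hook exactly once
  }
}
```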
override def metrics: StateStoreMetrics = {
@@ -244,7 +265,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
}
override def toString(): String = {
- s"HDFSStateStore[id=(op=${id.operatorId},part=${id.partitionId}),dir=$baseDir]"
+ s"HDFSStateStore[stateStoreId=$stateStoreId_, version=$version]"
}
override def removeColFamilyIfExists(colFamilyName: String): Boolean = {
@@ -351,7 +372,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
assert(
!storeConf.enableStateStoreCheckpointIds,
"HDFS State Store Provider doesn't support checkpointFormatVersion >= 2 " +
- s"checkpointFormatVersion ${storeConf.sqlConf.stateStoreCheckpointFormatVersion}")
+ s"checkpointFormatVersion ${storeConf.stateStoreCheckpointFormatVersion}")
this.stateStoreId_ = stateStoreId
this.keySchema = keySchema
@@ -360,6 +381,9 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
this.hadoopConf = hadoopConf
this.numberOfVersionsToRetainInMemory = storeConf.maxVersionsToRetainInMemory
+ val queryRunId = UUID.fromString(StateStoreProvider.getRunId(hadoopConf))
+ this.stateStoreProviderId = StateStoreProviderId(stateStoreId, queryRunId)
+
// run a bunch of validation checks for this state store provider
runValidation(useColumnFamilies, useMultipleValuesPerKey, keyStateEncoderSpec)
@@ -370,6 +394,8 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
override def stateStoreId: StateStoreId = stateStoreId_
+ override protected def logName: String = s"${super.logName} ${stateStoreProviderId}"
+
/** Do maintenance backing data files, including creating snapshots and cleaning up old files */
override def doMaintenance(): Unit = {
try {
@@ -377,7 +403,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
cleanup()
} catch {
case NonFatal(e) =>
- logWarning(log"Error performing snapshot and cleaning up " + toMessageWithContext)
+ logWarning(log"Error performing snapshot and cleaning up")
}
}
@@ -396,14 +422,8 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
override def supportedInstanceMetrics: Seq[StateStoreInstanceMetric] =
Seq(instanceMetricSnapshotLastUpload)
- private def toMessageWithContext: MessageWithContext = {
- log"HDFSStateStoreProvider[id = (op=${MDC(LogKeys.OP_ID, stateStoreId.operatorId)}," +
- log"part=${MDC(LogKeys.PARTITION_ID, stateStoreId.partitionId)})," +
- log"dir = ${MDC(LogKeys.PATH, baseDir)}]"
- }
-
override def toString(): String = {
- toMessageWithContext.message
+ s"HDFSStateStoreProvider[stateStoreProviderId=$stateStoreProviderId]"
}
/* Internal fields and methods */
@@ -415,6 +435,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
@volatile private var hadoopConf: Configuration = _
@volatile private var numberOfVersionsToRetainInMemory: Int = _
@volatile private var numColsPrefixKey: Int = 0
+ @volatile private var stateStoreProviderId: StateStoreProviderId = _
// TODO: The validation should be moved to a higher level so that it works for all state store
// implementations
@@ -640,7 +661,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
fileToRead, toString(), keySize)
} else {
val keyRowBuffer = new Array[Byte](keySize)
- ByteStreams.readFully(input, keyRowBuffer, 0, keySize)
+ Utils.readFully(input, keyRowBuffer, 0, keySize)
val keyRow = new UnsafeRow(keySchema.fields.length)
keyRow.pointTo(keyRowBuffer, keySize)
@@ -650,7 +671,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
map.remove(keyRow)
} else {
val valueRowBuffer = new Array[Byte](valueSize)
- ByteStreams.readFully(input, valueRowBuffer, 0, valueSize)
+ Utils.readFully(input, valueRowBuffer, 0, valueSize)
val valueRow = new UnsafeRow(valueSchema.fields.length)
// If valueSize in existing file is not multiple of 8, floor it to multiple of 8.
// This is a workaround for the following:
@@ -720,7 +741,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
rawStream: CancellableFSDataOutputStream): Unit = {
try {
if (rawStream != null) rawStream.cancel()
- IOUtils.closeQuietly(compressedStream)
+ Utils.closeQuietly(compressedStream)
} catch {
       // Closing the compressedStream causes the stream to write/flush data into the
// rawStream. Since the rawStream is already closed, there may be errors.
@@ -760,7 +781,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
fileToRead, toString(), keySize)
} else {
val keyRowBuffer = new Array[Byte](keySize)
- ByteStreams.readFully(input, keyRowBuffer, 0, keySize)
+ Utils.readFully(input, keyRowBuffer, 0, keySize)
val keyRow = new UnsafeRow(keySchema.fields.length)
keyRow.pointTo(keyRowBuffer, keySize)
@@ -771,7 +792,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
fileToRead, toString(), valueSize)
} else {
val valueRowBuffer = new Array[Byte](valueSize)
- ByteStreams.readFully(input, valueRowBuffer, 0, valueSize)
+ Utils.readFully(input, valueRowBuffer, 0, valueSize)
val valueRow = new UnsafeRow(valueSchema.fields.length)
// If valueSize in existing file is not multiple of 8, floor it to multiple of 8.
// This is a workaround for the following:
@@ -821,7 +842,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
}
} catch {
case NonFatal(e) =>
- logWarning(log"Error doing snapshots for " + toMessageWithContext, e)
+ logWarning(log"Error doing snapshots", e)
}
}
@@ -854,7 +875,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
}
} catch {
case NonFatal(e) =>
- logWarning(log"Error cleaning up files for " + toMessageWithContext, e)
+ logWarning(log"Error cleaning up files", e)
}
}
@@ -908,7 +929,7 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
case "snapshot" =>
versionToFiles.put(version, StoreFile(version, path, isSnapshot = true))
case _ => logWarning(
- log"Could not identify file ${MDC(LogKeys.PATH, path)} for " + toMessageWithContext)
+ log"Could not identify file ${MDC(LogKeys.PATH, path)}")
}
}
}
@@ -953,7 +974,8 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
* @param endVersion checkpoint version to end with
* @return [[HDFSBackedStateStore]]
*/
- override def replayStateFromSnapshot(snapshotVersion: Long, endVersion: Long): StateStore = {
+ override def replayStateFromSnapshot(
+ snapshotVersion: Long, endVersion: Long, readOnly: Boolean): StateStore = {
val newMap = replayLoadedMapFromSnapshot(snapshotVersion, endVersion)
logInfo(log"Retrieved snapshot at version " +
log"${MDC(LogKeys.STATE_STORE_VERSION, snapshotVersion)} and apply delta files to version " +
@@ -1057,11 +1079,9 @@ private[sql] class HDFSBackedStateStoreProvider extends StateStoreProvider with
/** Reports to the coordinator the store's latest snapshot version */
private def reportSnapshotUploadToCoordinator(version: Long): Unit = {
if (storeConf.reportSnapshotUploadLag) {
- // Attach the query run ID and current timestamp to the RPC message
- val runId = UUID.fromString(StateStoreProvider.getRunId(hadoopConf))
val currentTimestamp = System.currentTimeMillis()
StateStoreProvider.coordinatorRef.foreach(
- _.snapshotUploaded(StateStoreProviderId(stateStoreId, runId), version, currentTimestamp)
+ _.snapshotUploaded(stateStoreProviderId, version, currentTimestamp)
)
}
}
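The last hunk above replaces a per-report `UUID.fromString(...)` call with a provider ID computed once at init. A small sketch of that refactor, with simplified types (the `ProviderId`, `Provider`, and `report` names are hypothetical):

```scala
import java.util.UUID

object CachedProviderIdSketch {
  final case class ProviderId(storeId: String, runId: UUID)

  final class Provider(storeId: String, runIdFromConf: () => String) {
    // Computed once at initialization and reused by every subsequent report.
    private val providerId = ProviderId(storeId, UUID.fromString(runIdFromConf()))
    def report(version: Long): String = s"snapshotUploaded($providerId, $version)"
  }

  def main(args: Array[String]): Unit = {
    val runId = UUID.randomUUID().toString
    val provider = new Provider("op=0/part=3", () => runId)
    println(provider.report(12L))
  }
}
```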
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/OperatorStateMetadata.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/OperatorStateMetadata.scala
index 1c97e95847908..c34545216fdaf 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/OperatorStateMetadata.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/OperatorStateMetadata.scala
@@ -28,12 +28,14 @@ import org.json4s.{Formats, JBool, JObject, NoTypeHints}
import org.json4s.jackson.JsonMethods.{compact, render}
import org.json4s.jackson.Serialization
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.execution.datasources.v2.state.StateDataSourceErrors
-import org.apache.spark.sql.execution.streaming.{CheckpointFileManager, CommitLog, MetadataVersionUtil, StateStoreWriter, StreamingQueryCheckpointMetadata}
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager.CancellableFSDataOutputStream
-import org.apache.spark.sql.execution.streaming.StreamingCheckpointConstants.DIR_NAME_OFFSETS
+import org.apache.spark.sql.execution.streaming.checkpointing.{CheckpointFileManager, CommitLog, MetadataVersionUtil}
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager.CancellableFSDataOutputStream
+import org.apache.spark.sql.execution.streaming.operators.stateful.StateStoreWriter
+import org.apache.spark.sql.execution.streaming.runtime.StreamingCheckpointConstants.DIR_NAME_OFFSETS
+import org.apache.spark.sql.execution.streaming.runtime.StreamingQueryCheckpointMetadata
import org.apache.spark.sql.execution.streaming.state.OperatorStateMetadataUtils.{OperatorStateMetadataReader, OperatorStateMetadataWriter}
/**
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDB.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDB.scala
index 6b3bec2077037..85e2d72ec1630 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDB.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDB.scala
@@ -21,14 +21,13 @@ import java.io.File
import java.util.Locale
import java.util.Set
import java.util.UUID
-import java.util.concurrent.{ConcurrentHashMap, ConcurrentLinkedQueue, TimeUnit}
+import java.util.concurrent.{ConcurrentHashMap, ConcurrentLinkedQueue}
import java.util.concurrent.atomic.{AtomicBoolean, AtomicInteger, AtomicLong}
-import javax.annotation.concurrent.GuardedBy
import scala.collection.{mutable, Map}
import scala.jdk.CollectionConverters.ConcurrentMapHasAsScala
-import scala.ref.WeakReference
import scala.util.Try
+import scala.util.control.NonFatal
import org.apache.hadoop.conf.Configuration
import org.json4s.{Formats, NoTypeHints}
@@ -38,7 +37,7 @@ import org.rocksdb.CompressionType._
import org.rocksdb.TickerType._
import org.apache.spark.TaskContext
-import org.apache.spark.internal.{LogEntry, Logging, LogKeys, MDC}
+import org.apache.spark.internal.{LogEntry, Logging, LogKeys}
import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.util.{NextIterator, Utils}
@@ -75,7 +74,8 @@ class RocksDB(
useColumnFamilies: Boolean = false,
enableStateStoreCheckpointIds: Boolean = false,
partitionId: Int = 0,
- eventForwarder: Option[RocksDBEventForwarder] = None) extends Logging {
+ eventForwarder: Option[RocksDBEventForwarder] = None,
+ uniqueId: Option[String] = None) extends Logging {
import RocksDB._
@@ -158,7 +158,7 @@ class RocksDB(
private val byteArrayPair = new ByteArrayPair()
private val commitLatencyMs = new mutable.HashMap[String, Long]()
- private val acquireLock = new Object
+ private val loadMetrics = new mutable.HashMap[String, Long]()
@volatile private var db: NativeRocksDB = _
@volatile private var changelogWriter: Option[StateStoreChangelogWriter] = None
@@ -185,6 +185,25 @@ class RocksDB(
protected var sessionStateStoreCkptId: Option[String] = None
protected[sql] val lineageManager: RocksDBLineageManager = new RocksDBLineageManager
+ // Memory tracking fields for unmanaged memory monitoring
+ // This allows the UnifiedMemoryManager to track RocksDB memory usage without
+ // directly accessing RocksDB from the polling thread, avoiding segmentation faults
+
+ // Timestamp of the last memory usage update in milliseconds.
+ // Used to enforce the update interval and prevent excessive memory queries.
+ private val lastMemoryUpdateTime = new AtomicLong(0L)
+
+ // Minimum interval between memory usage updates in milliseconds.
+ // This prevents performance impact from querying RocksDB memory too frequently.
+ private val memoryUpdateIntervalMs = conf.memoryUpdateIntervalMs
+
+ // Generate a unique ID if not provided to ensure proper memory tracking
+ private val instanceUniqueId = uniqueId.getOrElse(UUID.randomUUID().toString)
+
+ // Register with RocksDBMemoryManager
+ // Initial registration with zero memory usage
+ RocksDBMemoryManager.updateMemoryUsage(instanceUniqueId, 0L, conf.boundedMemoryUsage)
+
@volatile private var numKeysOnLoadedVersion = 0L
@volatile private var numKeysOnWritingVersion = 0L
@@ -195,24 +214,14 @@ class RocksDB(
// SPARK-46249 - Keep track of recorded metrics per version which can be used for querying later
// Updates and access to recordedMetrics are protected by the DB instance lock
- @GuardedBy("acquireLock")
@volatile private var recordedMetrics: Option[RocksDBMetrics] = None
- @GuardedBy("acquireLock")
- @volatile private var acquiredThreadInfo: AcquiredThreadInfo = _
-
- // This is accessed and updated only between load and commit
- // which means it is implicitly guarded by acquireLock
- @GuardedBy("acquireLock")
private val colFamilyNameToInfoMap = new ConcurrentHashMap[String, ColumnFamilyInfo]()
- @GuardedBy("acquireLock")
private val colFamilyIdToNameMap = new ConcurrentHashMap[Short, String]()
- @GuardedBy("acquireLock")
private val maxColumnFamilyId: AtomicInteger = new AtomicInteger(-1)
- @GuardedBy("acquireLock")
private val shouldForceSnapshot: AtomicBoolean = new AtomicBoolean(false)
private def getColumnFamilyInfo(cfName: String): ColumnFamilyInfo = {
@@ -300,11 +309,6 @@ class RocksDB(
colFamilyNameToInfoMap.asScala.values.toSeq.count(_.isInternal == isInternal)
}
- // Mapping of local SST files to DFS files for file reuse.
- // This mapping should only be updated using the Task thread - at version load and commit time.
- // If same mapping instance is updated from different threads,
- // it will result in undefined behavior (and most likely incorrect mapping state).
- @GuardedBy("acquireLock")
private val rocksDBFileMapping: RocksDBFileMapping = new RocksDBFileMapping()
// We send snapshots that needs to be uploaded by the maintenance thread to this queue
@@ -583,9 +587,13 @@ class RocksDB(
version: Long,
stateStoreCkptId: Option[String] = None,
readOnly: Boolean = false): RocksDB = {
+ val startTime = System.currentTimeMillis()
+
assert(version >= 0)
- acquire(LoadStore)
recordedMetrics = None
+ // Reset the load metrics before loading
+ loadMetrics.clear()
+
logInfo(log"Loading ${MDC(LogKeys.VERSION_NUM, version)} with stateStoreCkptId: ${
MDC(LogKeys.UUID, stateStoreCkptId.getOrElse(""))}")
if (stateStoreCkptId.isDefined || enableStateStoreCheckpointIds && version == 0) {
@@ -593,6 +601,15 @@ class RocksDB(
} else {
loadWithoutCheckpointId(version, readOnly)
}
+
+ // Record the metrics after loading
+ val duration = System.currentTimeMillis() - startTime
+ loadMetrics ++= Map(
+ "load" -> duration
+ )
+ // Register with memory manager after successful load
+ updateMemoryUsageIfNeeded()
+
this
}
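The load path now clears a `loadMetrics` map and records the wall-clock duration of each load. A minimal sketch of that timing pattern, independent of RocksDB (names are illustrative):

```scala
import scala.collection.mutable

object LoadMetricsSketch {
  private val loadMetrics = new mutable.HashMap[String, Long]()

  // Clear the per-load metrics, run the load body, then record its duration.
  def timedLoad[T](body: => T): T = {
    loadMetrics.clear()
    val start = System.currentTimeMillis()
    val result = body
    loadMetrics += "load" -> (System.currentTimeMillis() - start)
    result
  }

  def main(args: Array[String]): Unit = {
    timedLoad { Thread.sleep(5) }
    println(loadMetrics) // e.g. Map(load -> 5)
  }
}
```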
@@ -608,9 +625,12 @@ class RocksDB(
* Source.
*/
def loadFromSnapshot(snapshotVersion: Long, endVersion: Long): RocksDB = {
+ val startTime = System.currentTimeMillis()
+
assert(snapshotVersion >= 0 && endVersion >= snapshotVersion)
- acquire(LoadStore)
recordedMetrics = None
+ loadMetrics.clear()
+
logInfo(
log"Loading snapshot at version ${MDC(LogKeys.VERSION_NUM, snapshotVersion)} and apply " +
log"changelog files to version ${MDC(LogKeys.VERSION_NUM, endVersion)}.")
@@ -627,6 +647,12 @@ class RocksDB(
}
// Report this snapshot version to the coordinator
reportSnapshotUploadToCoordinator(snapshotVersion)
+
+ // Record the metrics after loading
+ loadMetrics ++= Map(
+ "loadFromSnapshot" -> (System.currentTimeMillis() - startTime)
+ )
+
this
}
@@ -644,6 +670,18 @@ class RocksDB(
workingDir, rocksDBFileMapping)
loadedVersion = snapshotVersion
lastSnapshotVersion = snapshotVersion
+
+ setInitialCFInfo()
+ metadata.columnFamilyMapping.foreach { mapping =>
+ mapping.foreach { case (colFamilyName, cfId) =>
+ addToColFamilyMaps(colFamilyName, cfId, isInternalColFamily(colFamilyName, metadata))
+ }
+ }
+
+ metadata.maxColumnFamilyId.foreach { maxId =>
+ maxColumnFamilyId.set(maxId)
+ }
+
openDB()
val (numKeys, numInternalKeys) = if (!conf.trackTotalNumberOfRows) {
@@ -680,6 +718,8 @@ class RocksDB(
* Replay change log from the loaded version to the target version.
*/
private def replayChangelog(versionsAndUniqueIds: Array[(Long, Option[String])]): Unit = {
+ val startTime = System.currentTimeMillis()
+
assert(!versionsAndUniqueIds.isEmpty && versionsAndUniqueIds.head._1 == loadedVersion + 1,
s"Replay changelog should start from one version after loadedVersion: $loadedVersion," +
s" but it is not."
@@ -701,13 +741,13 @@ class RocksDB(
changelogReader.foreach { case (recordType, key, value) =>
recordType match {
case RecordType.PUT_RECORD =>
- put(key, value, includesPrefix = true)
+ put(key, value, includesPrefix = true, deriveCfName = true)
case RecordType.DELETE_RECORD =>
- remove(key, includesPrefix = true)
+ remove(key, includesPrefix = true, deriveCfName = true)
case RecordType.MERGE_RECORD =>
- merge(key, value, includesPrefix = true)
+ merge(key, value, includesPrefix = true, deriveCfName = true)
}
}
} else {
@@ -728,6 +768,12 @@ class RocksDB(
if (changelogReader != null) changelogReader.closeIfNeeded()
}
}
+
+ val duration = System.currentTimeMillis() - startTime
+ loadMetrics ++= Map(
+ "replayChangelog" -> Math.max(duration, 1L), // avoid flaky tests
+ "numReplayChangeLogFiles" -> versionsAndUniqueIds.length
+ )
}
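replayChangelog dispatches on the record type of each changelog entry and records the replay duration with a 1 ms floor. A self-contained sketch of that loop over a plain in-memory map (the record-type names mirror the diff; everything else is illustrative):

```scala
object ReplaySketch {
  sealed trait RecordType
  case object PutRecord extends RecordType
  case object DeleteRecord extends RecordType
  case object MergeRecord extends RecordType

  def replay(records: Seq[(RecordType, String, String)],
             store: scala.collection.mutable.Map[String, String]): Long = {
    val start = System.currentTimeMillis()
    records.foreach {
      case (PutRecord, k, v)    => store.put(k, v)
      case (MergeRecord, k, v)  => store.put(k, store.getOrElse(k, "") + v)
      case (DeleteRecord, k, _) => store.remove(k)
    }
    // Floor to 1 ms so callers never observe a zero duration.
    math.max(System.currentTimeMillis() - start, 1L)
  }

  def main(args: Array[String]): Unit = {
    val store = scala.collection.mutable.Map.empty[String, String]
    val ms = replay(Seq((PutRecord, "a", "1"), (MergeRecord, "a", "2"), (DeleteRecord, "a", "")), store)
    assert(store.isEmpty && ms >= 1L)
  }
}
```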
/**
@@ -763,6 +809,7 @@ class RocksDB(
def get(
key: Array[Byte],
cfName: String = StateStore.DEFAULT_COL_FAMILY_NAME): Array[Byte] = {
+ updateMemoryUsageIfNeeded()
val keyWithPrefix = if (useColumnFamilies) {
encodeStateRowWithPrefix(key, cfName)
} else {
@@ -829,14 +876,23 @@ class RocksDB(
key: Array[Byte],
value: Array[Byte],
cfName: String = StateStore.DEFAULT_COL_FAMILY_NAME,
- includesPrefix: Boolean = false): Unit = {
+ includesPrefix: Boolean = false,
+ deriveCfName: Boolean = false): Unit = {
+ updateMemoryUsageIfNeeded()
val keyWithPrefix = if (useColumnFamilies && !includesPrefix) {
encodeStateRowWithPrefix(key, cfName)
} else {
key
}
- handleMetricsUpdate(keyWithPrefix, cfName, isPutOrMerge = true)
+ val columnFamilyName = if (deriveCfName && useColumnFamilies) {
+ val (_, cfName) = decodeStateRowWithPrefix(keyWithPrefix)
+ cfName
+ } else {
+ cfName
+ }
+
+ handleMetricsUpdate(keyWithPrefix, columnFamilyName, isPutOrMerge = true)
db.put(writeOptions, keyWithPrefix, value)
changelogWriter.foreach(_.put(keyWithPrefix, value))
}
@@ -856,14 +912,23 @@ class RocksDB(
key: Array[Byte],
value: Array[Byte],
cfName: String = StateStore.DEFAULT_COL_FAMILY_NAME,
- includesPrefix: Boolean = false): Unit = {
+ includesPrefix: Boolean = false,
+ deriveCfName: Boolean = false): Unit = {
+ updateMemoryUsageIfNeeded()
val keyWithPrefix = if (useColumnFamilies && !includesPrefix) {
encodeStateRowWithPrefix(key, cfName)
} else {
key
}
- handleMetricsUpdate(keyWithPrefix, cfName, isPutOrMerge = true)
+ val columnFamilyName = if (deriveCfName && useColumnFamilies) {
+ val (_, cfName) = decodeStateRowWithPrefix(keyWithPrefix)
+ cfName
+ } else {
+ cfName
+ }
+
+ handleMetricsUpdate(keyWithPrefix, columnFamilyName, isPutOrMerge = true)
db.merge(writeOptions, keyWithPrefix, value)
changelogWriter.foreach(_.merge(keyWithPrefix, value))
}
@@ -875,14 +940,23 @@ class RocksDB(
def remove(
key: Array[Byte],
cfName: String = StateStore.DEFAULT_COL_FAMILY_NAME,
- includesPrefix: Boolean = false): Unit = {
+ includesPrefix: Boolean = false,
+ deriveCfName: Boolean = false): Unit = {
+ updateMemoryUsageIfNeeded()
val keyWithPrefix = if (useColumnFamilies && !includesPrefix) {
encodeStateRowWithPrefix(key, cfName)
} else {
key
}
- handleMetricsUpdate(keyWithPrefix, cfName, isPutOrMerge = false)
+ val columnFamilyName = if (deriveCfName && useColumnFamilies) {
+ val (_, cfName) = decodeStateRowWithPrefix(keyWithPrefix)
+ cfName
+ } else {
+ cfName
+ }
+
+ handleMetricsUpdate(keyWithPrefix, columnFamilyName, isPutOrMerge = false)
db.delete(writeOptions, keyWithPrefix)
changelogWriter.foreach(_.delete(keyWithPrefix))
}
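put/merge/remove gain a `deriveCfName` flag: when a key already carries its column-family prefix (e.g. during changelog replay), the column family is recovered from the key itself. A rough sketch of a prefix encode/decode round trip using a 2-byte id; Spark's actual virtual-column-family encoding may differ, and the id table here is made up:

```scala
import java.nio.ByteBuffer

object CfPrefixSketch {
  private val cfIdToName = Map[Short, String](1.toShort -> "default", 2.toShort -> "timers")
  private val cfNameToId = cfIdToName.map(_.swap)

  def encode(key: Array[Byte], cfName: String): Array[Byte] = {
    val buf = ByteBuffer.allocate(2 + key.length)
    buf.putShort(cfNameToId(cfName)).put(key)
    buf.array()
  }

  // Recover (key, columnFamilyName) from a prefixed key.
  def decode(keyWithPrefix: Array[Byte]): (Array[Byte], String) = {
    val buf = ByteBuffer.wrap(keyWithPrefix)
    val cfName = cfIdToName(buf.getShort())
    val key = new Array[Byte](keyWithPrefix.length - 2)
    buf.get(key)
    (key, cfName)
  }

  def main(args: Array[String]): Unit = {
    val (key, cf) = decode(encode("k1".getBytes, "timers"))
    assert(cf == "timers" && new String(key) == "k1")
  }
}
```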
@@ -890,7 +964,8 @@ class RocksDB(
/**
* Get an iterator of all committed and uncommitted key-value pairs.
*/
- def iterator(): Iterator[ByteArrayPair] = {
+ def iterator(): NextIterator[ByteArrayPair] = {
+ updateMemoryUsageIfNeeded()
val iter = db.newIterator()
logInfo(log"Getting iterator from version ${MDC(LogKeys.LOADED_VERSION, loadedVersion)}")
iter.seekToFirst()
@@ -926,7 +1001,8 @@ class RocksDB(
/**
* Get an iterator of all committed and uncommitted key-value pairs for the given column family.
*/
- def iterator(cfName: String): Iterator[ByteArrayPair] = {
+ def iterator(cfName: String): NextIterator[ByteArrayPair] = {
+ updateMemoryUsageIfNeeded()
if (!useColumnFamilies) {
iterator()
} else {
@@ -975,7 +1051,8 @@ class RocksDB(
def prefixScan(
prefix: Array[Byte],
- cfName: String = StateStore.DEFAULT_COL_FAMILY_NAME): Iterator[ByteArrayPair] = {
+ cfName: String = StateStore.DEFAULT_COL_FAMILY_NAME): NextIterator[ByteArrayPair] = {
+ updateMemoryUsageIfNeeded()
val iter = db.newIterator()
val updatedPrefix = if (useColumnFamilies) {
encodeStateRowWithPrefix(prefix, cfName)
@@ -1013,6 +1090,8 @@ class RocksDB(
}
}
+ def release(): Unit = {}
+
/**
* Commit all the updates made as a version to DFS. The steps it needs to do to commits are:
* - Flush all changes to disk
@@ -1020,6 +1099,8 @@ class RocksDB(
* - Sync the checkpoint dir files to DFS
*/
def commit(): (Long, StateStoreCheckpointInfo) = {
+ commitLatencyMs.clear()
+ updateMemoryUsageIfNeeded()
val newVersion = loadedVersion + 1
try {
logInfo(log"Flushing updates for ${MDC(LogKeys.VERSION_NUM, newVersion)}")
@@ -1031,13 +1112,14 @@ class RocksDB(
commitLatencyMs ++= snapshotLatency
}
+ var isUploaded = false
+
logInfo(log"Syncing checkpoint for ${MDC(LogKeys.VERSION_NUM, newVersion)} to DFS")
val fileSyncTimeMs = timeTakenMs {
if (enableChangelogCheckpointing) {
// If we have changed the columnFamilyId mapping, we have set a new
// snapshot and need to upload this to the DFS even if changelog checkpointing
// is enabled.
- var isUploaded = false
if (shouldForceSnapshot.get()) {
assert(snapshot.isDefined)
uploadSnapshot(snapshot.get)
@@ -1048,7 +1130,14 @@ class RocksDB(
// ensure that changelog files are always written
try {
assert(changelogWriter.isDefined)
- changelogWriter.foreach(_.commit())
+ val changeLogWriterCommitTimeMs = timeTakenMs {
+ changelogWriter.foreach(_.commit())
+ }
+ // Record the commit time for the changelog writer
+ commitLatencyMs ++= Map(
+ "changeLogWriterCommit" -> changeLogWriterCommitTimeMs
+ )
+
if (!isUploaded) {
snapshot.foreach(snapshotsToUploadQueue.offer)
}
@@ -1059,9 +1148,19 @@ class RocksDB(
assert(changelogWriter.isEmpty)
assert(snapshot.isDefined)
uploadSnapshot(snapshot.get)
+ isUploaded = true
}
}
+ if (isUploaded) {
+        // If we have uploaded the snapshot, the fileManagerMetrics will be cleared and updated
+        // in uploadSnapshot. Any new metrics specific to this commit should be added here so we
+        // don't accidentally pick up stale fileManagerMetrics from the maintenance thread.

+ commitLatencyMs ++= Map(
+ "saveZipFiles" -> fileManagerMetrics.saveZipFilesTimeMs.getOrElse(0L)
+ )
+ }
+
if (enableStateStoreCheckpointIds) {
lastCommitBasedStateStoreCkptId = loadedStateStoreCkptId
lastCommittedStateStoreCkptId = sessionStateStoreCkptId
@@ -1093,10 +1192,6 @@ class RocksDB(
case t: Throwable =>
loadedVersion = -1 // invalidate loaded version
throw t
- } finally {
- // reset resources as either 1) we already pushed the changes and it has been committed or
- // 2) commit has failed and the current version is "invalidated".
- release(LoadStore)
}
}
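The commit path now times the changelog writer commit with a `timeTakenMs`-style helper and folds the result into `commitLatencyMs`. A minimal sketch of that helper and how it feeds the latency map (the sleep stands in for the real commit call):

```scala
object TimeTakenSketch {
  // Run a block and return its result together with the elapsed wall-clock millis.
  def timeTakenMs[T](body: => T): (T, Long) = {
    val start = System.currentTimeMillis()
    val result = body
    (result, System.currentTimeMillis() - start)
  }

  def main(args: Array[String]): Unit = {
    val commitLatencyMs = scala.collection.mutable.HashMap.empty[String, Long]
    val (_, elapsed) = timeTakenMs { Thread.sleep(3) } // stand-in for changelogWriter.commit()
    commitLatencyMs += "changeLogWriterCommit" -> elapsed
    println(commitLatencyMs)
  }
}
```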
@@ -1180,23 +1275,18 @@ class RocksDB(
* Drop uncommitted changes, and roll back to previous version.
*/
def rollback(): Unit = {
- acquire(RollbackStore)
- try {
- numKeysOnWritingVersion = numKeysOnLoadedVersion
- numInternalKeysOnWritingVersion = numInternalKeysOnLoadedVersion
- loadedVersion = -1L
- lastCommitBasedStateStoreCkptId = None
- lastCommittedStateStoreCkptId = None
- loadedStateStoreCkptId = None
- sessionStateStoreCkptId = None
- lineageManager.clear()
- changelogWriter.foreach(_.abort())
- // Make sure changelogWriter gets recreated next time.
- changelogWriter = None
- logInfo(log"Rolled back to ${MDC(LogKeys.VERSION_NUM, loadedVersion)}")
- } finally {
- release(RollbackStore)
- }
+ numKeysOnWritingVersion = numKeysOnLoadedVersion
+ numInternalKeysOnWritingVersion = numInternalKeysOnLoadedVersion
+ loadedVersion = -1L
+ lastCommitBasedStateStoreCkptId = None
+ lastCommittedStateStoreCkptId = None
+ loadedStateStoreCkptId = None
+ sessionStateStoreCkptId = None
+ lineageManager.clear()
+ changelogWriter.foreach(_.abort())
+ // Make sure changelogWriter gets recreated next time.
+ changelogWriter = None
+ logInfo(log"Rolled back to ${MDC(LogKeys.VERSION_NUM, loadedVersion)}")
}
def doMaintenance(): Unit = {
@@ -1228,7 +1318,6 @@ class RocksDB(
/** Release all resources */
def close(): Unit = {
// Acquire DB instance lock and release at the end to allow for synchronized access
- acquire(CloseStore)
try {
closeDB()
@@ -1244,14 +1333,21 @@ class RocksDB(
snapshot = snapshotsToUploadQueue.poll()
}
+ // Unregister from RocksDBMemoryManager
+ try {
+ RocksDBMemoryManager.unregisterInstance(instanceUniqueId)
+ } catch {
+ case NonFatal(e) =>
+ logWarning(log"Failed to unregister from RocksDBMemoryManager " +
+ log"${MDC(LogKeys.EXCEPTION, e)}")
+ }
+
silentDeleteRecursively(localRootDir, "closing RocksDB")
// Clear internal maps to reset the state
clearColFamilyMaps()
} catch {
case e: Exception =>
logWarning("Error closing RocksDB", e)
- } finally {
- release(CloseStore)
}
}
@@ -1278,9 +1374,6 @@ class RocksDB(
private def metrics: RocksDBMetrics = {
import HistogramType._
val totalSSTFilesBytes = getDBProperty("rocksdb.total-sst-files-size")
- val readerMemUsage = getDBProperty("rocksdb.estimate-table-readers-mem")
- val memTableMemUsage = getDBProperty("rocksdb.size-all-mem-tables")
- val blockCacheUsage = getDBProperty("rocksdb.block-cache-usage")
val pinnedBlocksMemUsage = getDBProperty("rocksdb.block-cache-pinned-usage")
val nativeOpsHistograms = Seq(
"get" -> DB_GET,
@@ -1314,14 +1407,8 @@ class RocksDB(
nativeStats.getTickerCount(typ)
}
- // if bounded memory usage is enabled, we share the block cache across all state providers
- // running on the same node and account the usage to this single cache. In this case, its not
- // possible to provide partition level or query level memory usage.
- val memoryUsage = if (conf.boundedMemoryUsage) {
- 0L
- } else {
- readerMemUsage + memTableMemUsage + blockCacheUsage
- }
+ // Use RocksDBMemoryManager to calculate the memory usage accounting
+ val memoryUsage = RocksDBMemoryManager.getInstanceMemoryUsage(instanceUniqueId, getMemoryUsage)
RocksDBMetrics(
numKeysOnLoadedVersion,
@@ -1331,7 +1418,9 @@ class RocksDB(
pinnedBlocksMemUsage,
totalSSTFilesBytes,
nativeOpsLatencyMicros,
- commitLatencyMs,
+      // Clone the maps so the returned metrics do not share mutable state with this instance
+ commitLatencyMs.clone(),
+ loadMetrics.clone(),
bytesCopied = fileManagerMetrics.bytesCopied,
filesCopied = fileManagerMetrics.filesCopied,
filesReused = fileManagerMetrics.filesReused,
@@ -1347,100 +1436,67 @@ class RocksDB(
*/
def metricsOpt: Option[RocksDBMetrics] = {
var rocksDBMetricsOpt: Option[RocksDBMetrics] = None
- acquire(ReportStoreMetrics)
try {
rocksDBMetricsOpt = recordedMetrics
} catch {
case ex: Exception =>
logInfo(log"Failed to acquire metrics with exception=${MDC(LogKeys.ERROR, ex)}")
- } finally {
- release(ReportStoreMetrics)
}
rocksDBMetricsOpt
}
/**
- * Function to acquire RocksDB instance lock that allows for synchronized access to the state
- * store instance
- *
- * @param opType - operation type requesting the lock
+ * Refresh the recorded metrics with the latest metrics.
*/
- private def acquire(opType: RocksDBOpType): Unit = acquireLock.synchronized {
- val newAcquiredThreadInfo = AcquiredThreadInfo()
- val waitStartTime = System.nanoTime()
- def timeWaitedMs = {
- val elapsedNanos = System.nanoTime() - waitStartTime
- TimeUnit.MILLISECONDS.convert(elapsedNanos, TimeUnit.NANOSECONDS)
- }
- def isAcquiredByDifferentThread = acquiredThreadInfo != null &&
- acquiredThreadInfo.threadRef.get.isDefined &&
- newAcquiredThreadInfo.threadRef.get.get.getId != acquiredThreadInfo.threadRef.get.get.getId
-
- while (isAcquiredByDifferentThread && timeWaitedMs < conf.lockAcquireTimeoutMs) {
- acquireLock.wait(10)
- }
- if (isAcquiredByDifferentThread) {
- val stackTraceOutput = acquiredThreadInfo.threadRef.get.get.getStackTrace.mkString("\n")
- throw QueryExecutionErrors.unreleasedThreadError(loggingId, opType.toString,
- newAcquiredThreadInfo.toString(), acquiredThreadInfo.toString(), timeWaitedMs,
- stackTraceOutput)
- } else {
- acquiredThreadInfo = newAcquiredThreadInfo
- // Add a listener to always release the lock when the task (if active) completes
- Option(TaskContext.get()).foreach(_.addTaskCompletionListener[Unit] {
- _ => this.release(StoreTaskCompletionListener, Some(newAcquiredThreadInfo))
- })
- logInfo(log"RocksDB instance was acquired by " +
- log"ownerThread=${MDC(LogKeys.THREAD, acquiredThreadInfo)} " +
- log"for opType=${MDC(LogKeys.OP_TYPE, opType.toString)}")
- }
+ private[state] def refreshRecordedMetricsForTest(): Unit = {
+ recordedMetrics = Some(metrics)
}
+ private def getDBProperty(property: String): Long = db.getProperty(property).toLong
+
/**
- * Function to release RocksDB instance lock that allows for synchronized access to the state
- * store instance. Optionally provide a thread to check against, and release only if provided
- * thread is the one that acquired the lock.
+ * Returns the current memory usage of this RocksDB instance in bytes.
+ * WARNING: This method should only be called from the task thread when
+ * RocksDB is in a safe state.
*
- * @param opType - operation type releasing the lock
- * @param releaseForThreadOpt - optional thread to check against acquired thread
+ * This includes memory from all major RocksDB components:
+ * - Table readers (indexes and filters in memory)
+ * - Memtables (write buffers)
+ * - Block cache (cached data blocks)
+ * - Block cache pinned usage (blocks pinned in cache)
+ *
+ * @return Total memory usage in bytes across all tracked components
*/
- private def release(
- opType: RocksDBOpType,
- releaseForThreadOpt: Option[AcquiredThreadInfo] = None): Unit = acquireLock.synchronized {
- if (acquiredThreadInfo != null) {
- val release = releaseForThreadOpt match {
- case Some(releaseForThread) if releaseForThread.threadRef.get.isEmpty =>
- logInfo(log"Thread reference is empty when attempting to release for " +
- log"opType=${MDC(LogKeys.OP_TYPE, opType.toString)}, ignoring release. " +
- log"Lock is held by ownerThread=${MDC(LogKeys.THREAD, acquiredThreadInfo)}")
- false
- // NOTE: we compare the entire acquiredThreadInfo object to ensure that we are
- // releasing not only for the right thread but the right task as well. This is
- // inconsistent with the logic for acquire which uses only the thread ID, consider
- // updating this in future.
- case Some(releaseForThread) if acquiredThreadInfo != releaseForThread =>
- logInfo(log"Thread info for " +
- log"releaseThread=${MDC(LogKeys.THREAD, releaseForThreadOpt.get)} " +
- log"does not match the acquired thread when attempting to " +
- log"release for opType=${MDC(LogKeys.OP_TYPE, opType.toString)}, ignoring release. " +
- log"Lock is held by ownerThread=${MDC(LogKeys.THREAD, acquiredThreadInfo)}")
- false
- case _ => true
- }
+ def getMemoryUsage: Long = {
+ require(db != null && !db.isClosed, "RocksDB must be open to get memory usage")
+ RocksDB.mainMemorySources.map(getDBProperty).sum
+ }
+
+ /**
+ * Updates the cached memory usage if enough time has passed.
+ * This is called from task thread operations, so it's already thread-safe.
+ */
+ def updateMemoryUsageIfNeeded(): Unit = {
+
+ val currentTime = System.currentTimeMillis()
+ val timeSinceLastUpdate = currentTime - lastMemoryUpdateTime.get()
- if (release) {
- logInfo(log"RocksDB instance was released by " +
- log"releaseThread=${MDC(LogKeys.THREAD, AcquiredThreadInfo())} " +
- log"with ownerThread=${MDC(LogKeys.THREAD, acquiredThreadInfo)} " +
- log"for opType=${MDC(LogKeys.OP_TYPE, opType.toString)}")
- acquiredThreadInfo = null
- acquireLock.notifyAll()
+ if (timeSinceLastUpdate >= memoryUpdateIntervalMs && db != null && !db.isClosed) {
+ try {
+ val usage = getMemoryUsage
+ lastMemoryUpdateTime.set(currentTime)
+ // Report usage to RocksDBMemoryManager
+ RocksDBMemoryManager.updateMemoryUsage(
+ instanceUniqueId,
+ usage,
+ conf.boundedMemoryUsage)
+ } catch {
+ case NonFatal(e) =>
+ logDebug(s"Failed to update RocksDB memory usage: ${e.getMessage}")
}
}
}
- private def getDBProperty(property: String): Long = db.getProperty(property).toLong
-
private def openDB(): Unit = {
assert(db == null)
db = NativeRocksDB.open(rocksDbOptions, workingDir.toString)
@@ -1462,11 +1518,6 @@ class RocksDB(
}
}
- private[state] def getAcquiredThreadInfo(): Option[AcquiredThreadInfo] =
- acquireLock.synchronized {
- Option(acquiredThreadInfo).map(_.copy())
- }
-
/** Upload the snapshot to DFS and remove it from snapshots pending */
private def uploadSnapshot(
snapshot: RocksDBSnapshot,
@@ -1565,6 +1616,12 @@ class RocksDB(
}
object RocksDB extends Logging {
+
+ val mainMemorySources: Seq[String] = Seq(
+ "rocksdb.estimate-table-readers-mem",
+ "rocksdb.size-all-mem-tables",
+ "rocksdb.block-cache-usage")
+
case class RocksDBSnapshot(
checkpointDir: File,
version: Long,
@@ -1705,6 +1762,24 @@ class RocksDBFileMapping {
}.getOrElse(None)
}
+ /**
+ * Remove all local file mappings that are incompatible with the current version we are
+ * trying to load.
+ *
+ * @return seq of purged mappings
+ */
+ def purgeIncompatibleMappingsForLoad(versionToLoad: Long):
+ Seq[(String, (Long, RocksDBImmutableFile))] = {
+ val filesToRemove = localFileMappings.filter {
+ case (_, (dfsFileMappedVersion, _)) =>
+ dfsFileMappedVersion >= versionToLoad
+ }.toSeq
+ filesToRemove.foreach { case (localFileName, _) =>
+ remove(localFileName)
+ }
+ filesToRemove
+ }
+
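A self-contained sketch of the purge logic above: drop every local file mapping whose recorded DFS version is at or beyond the version being loaded, and return what was removed. Types are simplified to plain strings:

```scala
import scala.collection.mutable

object PurgeMappingsSketch {
  // localFileName -> (dfsFileMappedVersion, dfsFileName)
  private val localFileMappings = mutable.Map[String, (Long, String)]()

  def purgeIncompatibleMappingsForLoad(versionToLoad: Long): Seq[(String, (Long, String))] = {
    val toRemove = localFileMappings.filter { case (_, (mappedVersion, _)) =>
      mappedVersion >= versionToLoad
    }.toSeq
    toRemove.foreach { case (localFile, _) => localFileMappings.remove(localFile) }
    toRemove
  }

  def main(args: Array[String]): Unit = {
    localFileMappings ++= Seq("a.sst" -> (3L, "dfs/a"), "b.sst" -> (7L, "dfs/b"))
    val purged = purgeIncompatibleMappingsForLoad(5L)
    assert(purged.map(_._1) == Seq("b.sst") && localFileMappings.size == 1)
  }
}
```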
def mapToDfsFile(
localFileName: String,
dfsFile: RocksDBImmutableFile,
@@ -1788,6 +1863,7 @@ case class RocksDBConf(
totalMemoryUsageMB: Long,
writeBufferCacheRatio: Double,
highPriorityPoolRatio: Double,
+ memoryUpdateIntervalMs: Long,
compressionCodec: String,
allowFAllocate: Boolean,
compression: String,
@@ -1874,6 +1950,12 @@ object RocksDBConf {
private val HIGH_PRIORITY_POOL_RATIO_CONF = SQLConfEntry(HIGH_PRIORITY_POOL_RATIO_CONF_KEY,
"0.1")
+ // Memory usage update interval for unmanaged memory tracking
+ val MEMORY_UPDATE_INTERVAL_MS_CONF_KEY = "memoryUpdateIntervalMs"
+ private val MEMORY_UPDATE_INTERVAL_MS_CONF = SQLConfEntry(MEMORY_UPDATE_INTERVAL_MS_CONF_KEY,
+ "1000")
+
+
// Allow files to be pre-allocated on disk using fallocate
// Disabling may slow writes, but can solve an issue where
// significant quantities of disk are wasted if there are
@@ -1972,6 +2054,7 @@ object RocksDBConf {
getLongConf(MAX_MEMORY_USAGE_MB_CONF),
getRatioConf(WRITE_BUFFER_CACHE_RATIO_CONF),
getRatioConf(HIGH_PRIORITY_POOL_RATIO_CONF),
+ getPositiveLongConf(MEMORY_UPDATE_INTERVAL_MS_CONF),
storeConf.compressionCodec,
getBooleanConf(ALLOW_FALLOCATE_CONF),
getStringConf(COMPRESSION_CONF),
@@ -1991,6 +2074,7 @@ case class RocksDBMetrics(
totalSSTFilesBytes: Long,
nativeOpsHistograms: Map[String, RocksDBNativeHistogram],
lastCommitLatencyMs: Map[String, Long],
+ loadMetrics: Map[String, Long],
filesCopied: Long,
bytesCopied: Long,
filesReused: Long,
@@ -2023,21 +2107,6 @@ object RocksDBNativeHistogram {
}
}
-case class AcquiredThreadInfo(
- threadRef: WeakReference[Thread] = new WeakReference[Thread](Thread.currentThread()),
- tc: TaskContext = TaskContext.get()) {
- override def toString(): String = {
- val taskStr = if (tc != null) {
- val taskDetails =
- s"partition ${tc.partitionId()}.${tc.attemptNumber()} in stage " +
- s"${tc.stageId()}.${tc.stageAttemptNumber()}, TID ${tc.taskAttemptId()}"
- s", task: $taskDetails"
- } else ""
-
- s"[ThreadId: ${threadRef.get.map(_.getId)}$taskStr]"
- }
-}
-
/**
* A helper class to manage the lineage information when checkpoint unique id is enabled.
* "lineage" is an array of LineageItem (version, uniqueId) pair.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBFileManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBFileManager.scala
index 562a57aafbd41..0063f960c4757 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBFileManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBFileManager.scala
@@ -30,17 +30,18 @@ import com.fasterxml.jackson.annotation.JsonInclude.Include
import com.fasterxml.jackson.databind.{DeserializationFeature, ObjectMapper}
import com.fasterxml.jackson.databind.annotation.JsonDeserialize
import com.fasterxml.jackson.module.scala.{ClassTagExtensions, DefaultScalaModule}
-import org.apache.commons.io.{FilenameUtils, IOUtils}
+import org.apache.commons.io.FilenameUtils
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FileStatus, FileSystem, Path, PathFilter}
import org.json4s.{Formats, NoTypeHints}
import org.json4s.jackson.Serialization
import org.apache.spark.{SparkConf, SparkEnv, SparkException}
-import org.apache.spark.internal.{Logging, LogKeys, MDC, MessageWithContext}
+import org.apache.spark.internal.{Logging, LogKeys, MessageWithContext}
+import org.apache.spark.internal.LogKeys.{DFS_FILE, VERSION_NUM}
import org.apache.spark.io.CompressionCodec
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
import org.apache.spark.sql.internal.SQLConf
import org.apache.spark.util.ArrayImplicits._
import org.apache.spark.util.Utils
@@ -298,22 +299,31 @@ class RocksDBFileManager(
logDebug(log"Written metadata for version ${MDC(LogKeys.VERSION_NUM, version)}:\n" +
log"${MDC(LogKeys.METADATA_JSON, metadata.prettyJson)}")
- if (version <= 1 && numKeys <= 0) {
- // If we're writing the initial version and there's no data, we have to explicitly initialize
- // the root directory. Normally saveImmutableFilesToDfs will do this initialization, but
- // when there's no data that method won't write any files, and zipToDfsFile uses the
- // CheckpointFileManager.createAtomic API which doesn't auto-initialize parent directories.
- // Moreover, once we disable to track the number of keys, in which the numKeys is -1, we
- // still need to create the initial dfs root directory anyway.
- if (!rootDirChecked) {
- val path = new Path(dfsRootDir)
- if (!fm.exists(path)) fm.mkdirs(path)
- rootDirChecked = true
+ val (_, zipFilesTimeMs) = Utils.timeTakenMs {
+ if (version <= 1 && numKeys <= 0) {
+ // If we're writing the initial version and there's no data, we have to initialize
+ // the root directory. Normally saveImmutableFilesToDfs will do this initialization, but
+ // when there's no data that method won't write any files, and zipToDfsFile uses the
+ // CheckpointFileManager.createAtomic API which doesn't auto-initialize parent directories.
+        // Moreover, once we disable tracking the number of keys (i.e. numKeys is -1), we
+ // still need to create the initial dfs root directory anyway.
+ if (!rootDirChecked) {
+ val path = new Path(dfsRootDir)
+ if (!fm.exists(path)) fm.mkdirs(path)
+ rootDirChecked = true
+ }
}
+ zipToDfsFile(localOtherFiles :+ metadataFile, dfsBatchZipFile(version, checkpointUniqueId))
+ logInfo(log"Saved checkpoint file for version ${MDC(LogKeys.VERSION_NUM, version)} " +
+ log"checkpointUniqueId: ${MDC(LogKeys.UUID, checkpointUniqueId.getOrElse(""))}")
}
- zipToDfsFile(localOtherFiles :+ metadataFile, dfsBatchZipFile(version, checkpointUniqueId))
- logInfo(log"Saved checkpoint file for version ${MDC(LogKeys.VERSION_NUM, version)} " +
- log"checkpointUniqueId: ${MDC(LogKeys.UUID, checkpointUniqueId.getOrElse(""))}")
+
+ // populate the SaveCheckpointMetrics
+ saveCheckpointMetrics =
+ saveCheckpointMetrics.copy(
+        // Round up to 1ms so a nonzero duration is always recorded and tests aren't flaky
+ saveZipFilesTimeMs = Some(Math.max(zipFilesTimeMs, 1L))
+ )
}
/**
@@ -335,7 +345,7 @@ class RocksDBFileManager(
versionToRocksDBFiles.keySet().removeIf(_._1 >= version)
val metadata = if (version == 0) {
if (localDir.exists) Utils.deleteRecursively(localDir)
- localDir.mkdirs()
+ Utils.createDirectory(localDir)
// Since we cleared the local dir, we should also clear the local file mapping
rocksDBFileMapping.clear()
RocksDBCheckpointMetadata(Seq.empty, 0)
@@ -785,6 +795,17 @@ class RocksDBFileManager(
}
}
+ // Delete remaining unnecessary local immutable file mappings.
+ // Files present in the file mapping but not the filesystem may lead to
+ // versionID mismatch error (SPARK-52637), so we should explicitly delete
+ // them.
+ rocksDBFileMapping.purgeIncompatibleMappingsForLoad(version).foreach {
+ case (_, (dfsFileMappedVersion, dfsFile)) =>
+ logInfo(log"Deleted local fileMapping to ${MDC(DFS_FILE, dfsFile)} because " +
+ log"mapped file version ${MDC(VERSION_NUM, dfsFileMappedVersion)} was " +
+ log"incompatible with versionToLoad ${MDC(VERSION_NUM, version)}")
+ }
+
var filesCopied = 0L
var bytesCopied = 0L
var filesReused = 0L
@@ -828,7 +849,7 @@ class RocksDBFileManager(
private def getImmutableFilesFromVersionZip(
version: Long, checkpointUniqueId: Option[String] = None): Seq[RocksDBImmutableFile] = {
Utils.deleteRecursively(localTempDir)
- localTempDir.mkdirs()
+ Utils.createDirectory(localTempDir)
Utils.unzipFilesFromFile(fs, dfsBatchZipFile(version, checkpointUniqueId), localTempDir)
val metadataFile = localMetadataFile(localTempDir)
val metadata = RocksDBCheckpointMetadata.readFromFile(metadataFile)
@@ -849,7 +870,7 @@ class RocksDBFileManager(
files.foreach { file =>
zout.putNextEntry(new ZipEntry(file.getName))
in = new FileInputStream(file)
- val bytes = IOUtils.copy(in, zout)
+ val bytes = in.transferTo(zout)
in.close()
zout.closeEntry()
totalBytes += bytes
@@ -868,8 +889,8 @@ class RocksDBFileManager(
throw e
} finally {
// Close everything no matter what happened
- IOUtils.closeQuietly(in)
- IOUtils.closeQuietly(zout)
+ Utils.closeQuietly(in)
+ Utils.closeQuietly(zout)
}
}
@@ -950,7 +971,9 @@ case class RocksDBFileManagerMetrics(
bytesCopied: Long,
filesReused: Long,
@JsonDeserialize(contentAs = classOf[java.lang.Long])
- zipFileBytesUncompressed: Option[Long] = None)
+ zipFileBytesUncompressed: Option[Long] = None,
+ @JsonDeserialize(contentAs = classOf[java.lang.Long])
+ saveZipFilesTimeMs: Option[Long] = None)
/**
* Metrics to return when requested but no operation has been performed.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBMemoryManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBMemoryManager.scala
index 273cbbc5e87d5..82ee1803b3172 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBMemoryManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBMemoryManager.scala
@@ -17,22 +17,117 @@
package org.apache.spark.sql.execution.streaming.state
+import java.util.concurrent.ConcurrentHashMap
+
+import scala.jdk.CollectionConverters._
+
import org.rocksdb._
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.SparkEnv
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
+import org.apache.spark.memory.{MemoryMode, UnifiedMemoryManager, UnmanagedMemoryConsumer, UnmanagedMemoryConsumerId}
/**
* Singleton responsible for managing cache and write buffer manager associated with all RocksDB
* state store instances running on a single executor if boundedMemoryUsage is enabled for RocksDB.
* If boundedMemoryUsage is disabled, a new cache object is returned.
+ * This also implements UnmanagedMemoryConsumer to report RocksDB memory usage to Spark's
+ * UnifiedMemoryManager, allowing Spark to account for RocksDB memory when making
+ * memory allocation decisions.
*/
-object RocksDBMemoryManager extends Logging {
+object RocksDBMemoryManager extends Logging with UnmanagedMemoryConsumer {
private var writeBufferManager: WriteBufferManager = null
private var cache: Cache = null
+ // Tracks memory usage and bounded memory mode per unique ID
+ private case class InstanceMemoryInfo(memoryUsage: Long, isBoundedMemory: Boolean)
+ private val instanceMemoryMap = new ConcurrentHashMap[String, InstanceMemoryInfo]()
+
+ override def unmanagedMemoryConsumerId: UnmanagedMemoryConsumerId = {
+ UnmanagedMemoryConsumerId("RocksDB", "RocksDB-Memory-Manager")
+ }
+
+ override def memoryMode: MemoryMode = {
+ // RocksDB uses native/off-heap memory for its data structures
+ MemoryMode.OFF_HEAP
+ }
+
+ override def getMemBytesUsed: Long = {
+ val memoryInfos = instanceMemoryMap.values().asScala.toSeq
+ if (memoryInfos.isEmpty) {
+ return 0L
+ }
+
+ // Separate instances by bounded vs unbounded memory mode
+ val (bounded, unbounded) = memoryInfos.partition(_.isBoundedMemory)
+
+ // For bounded memory instances, they all share the same memory pool,
+ // so just take the max value (they should all be similar)
+ val boundedMemory = if (bounded.nonEmpty) bounded.map(_.memoryUsage).max else 0L
+
+ // For unbounded memory instances, sum their individual usages
+ val unboundedMemory = unbounded.map(_.memoryUsage).sum
+
+ // Total is bounded memory (shared) + sum of unbounded memory (individual)
+ boundedMemory + unboundedMemory
+ }
+
+ /**
+ * Register/update a RocksDB instance with its memory usage.
+ * @param uniqueId The instance's unique identifier
+ * @param memoryUsage The current memory usage in bytes
+ * @param isBoundedMemory Whether this instance uses bounded memory mode
+ */
+ def updateMemoryUsage(
+ uniqueId: String,
+ memoryUsage: Long,
+ isBoundedMemory: Boolean): Unit = {
+ instanceMemoryMap.put(uniqueId, InstanceMemoryInfo(memoryUsage, isBoundedMemory))
+ logDebug(s"Updated memory usage for $uniqueId: $memoryUsage bytes " +
+ s"(bounded=$isBoundedMemory)")
+ }
+
+ /**
+ * Unregister a RocksDB instance.
+ * @param uniqueId The instance's unique identifier
+ */
+ def unregisterInstance(uniqueId: String): Unit = {
+ instanceMemoryMap.remove(uniqueId)
+ logDebug(s"Unregistered instance $uniqueId")
+ }
+
+ def getNumRocksDBInstances(boundedMemory: Boolean): Long = {
+ instanceMemoryMap.values().asScala.count(_.isBoundedMemory == boundedMemory)
+ }
+
+ /**
+ * Get the memory usage for a specific instance, accounting for bounded memory sharing.
+ * @param uniqueId The instance's unique identifier
+ * @param totalMemoryUsage The total memory usage of this instance
+ * @return The adjusted memory usage accounting for sharing in bounded memory mode
+ */
+ def getInstanceMemoryUsage(uniqueId: String, totalMemoryUsage: Long): Long = {
+ val instanceInfo = instanceMemoryMap.
+ getOrDefault(uniqueId, InstanceMemoryInfo(0L, isBoundedMemory = false))
+ if (instanceInfo.isBoundedMemory) {
+ // In bounded memory mode, divide by the number of bounded instances
+ // since they share the same memory pool
+ val numBoundedInstances = getNumRocksDBInstances(true)
+ totalMemoryUsage / numBoundedInstances
+ } else {
+ // In unbounded memory mode, each instance has its own memory
+ totalMemoryUsage
+ }
+ }
+
def getOrCreateRocksDBMemoryManagerAndCache(conf: RocksDBConf): (WriteBufferManager, Cache)
= synchronized {
+ // Register with UnifiedMemoryManager (idempotent operation)
+ if (SparkEnv.get != null) {
+ UnifiedMemoryManager.registerUnmanagedMemoryConsumer(this)
+ }
+
if (conf.boundedMemoryUsage) {
if (writeBufferManager == null) {
assert(cache == null)
@@ -72,5 +167,6 @@ object RocksDBMemoryManager extends Logging {
def resetWriteBufferManagerAndCache: Unit = synchronized {
writeBufferManager = null
cache = null
+ instanceMemoryMap.clear()
}
}
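The aggregation in `getMemBytesUsed` treats bounded-memory instances as sharers of one pool (take the max of their reports) and sums the unbounded ones. A minimal sketch of exactly that calculation:

```scala
object MemoryAggregationSketch {
  final case class InstanceMemoryInfo(memoryUsage: Long, isBoundedMemory: Boolean)

  def totalMemBytesUsed(infos: Seq[InstanceMemoryInfo]): Long = {
    val (bounded, unbounded) = infos.partition(_.isBoundedMemory)
    // Bounded instances share a single cache, so count that pool once.
    val boundedMemory = if (bounded.nonEmpty) bounded.map(_.memoryUsage).max else 0L
    boundedMemory + unbounded.map(_.memoryUsage).sum
  }

  def main(args: Array[String]): Unit = {
    val infos = Seq(
      InstanceMemoryInfo(100L, isBoundedMemory = true),  // shared pool
      InstanceMemoryInfo(110L, isBoundedMemory = true),  // shared pool (max wins)
      InstanceMemoryInfo(40L, isBoundedMemory = false))  // private usage
    assert(totalMemBytesUsed(infos) == 150L)
  }
}
```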
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateEncoder.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateEncoder.scala
index cf5f8ba5f2ebe..f49c79f96b9ce 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateEncoder.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateEncoder.scala
@@ -36,7 +36,8 @@ import org.apache.spark.sql.avro.{AvroDeserializer, AvroOptions, AvroSerializer,
import org.apache.spark.sql.catalyst.InternalRow
import org.apache.spark.sql.catalyst.expressions.{BoundReference, JoinedRow, UnsafeProjection, UnsafeRow}
import org.apache.spark.sql.catalyst.expressions.codegen.UnsafeRowWriter
-import org.apache.spark.sql.execution.streaming.{CheckpointFileManager, StateStoreColumnFamilySchemaUtils}
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.operators.stateful.transformwithstate.StateStoreColumnFamilySchemaUtils
import org.apache.spark.sql.execution.streaming.state.RocksDBStateStoreProvider.{SCHEMA_ID_PREFIX_BYTES, STATE_ENCODING_NUM_VERSION_BYTES, STATE_ENCODING_VERSION}
import org.apache.spark.sql.types._
import org.apache.spark.unsafe.Platform
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateMachine.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateMachine.scala
new file mode 100644
index 0000000000000..80ef42f9bd75b
--- /dev/null
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateMachine.scala
@@ -0,0 +1,330 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.execution.streaming.state
+
+import java.util.concurrent.TimeUnit
+import java.util.concurrent.atomic.AtomicLong
+import javax.annotation.concurrent.GuardedBy
+
+import scala.ref.WeakReference
+
+import org.apache.spark.TaskContext
+import org.apache.spark.internal.{Logging, LogKeys}
+import org.apache.spark.sql.errors.QueryExecutionErrors
+
+/**
+ * A state machine that manages the lifecycle of a RocksDB instance.
+ *
+ * This class enforces proper state transitions and ensures thread-safe access to a RocksDB
+ * instance. It prevents concurrent modifications to the same native RocksDB instance by using
+ * a stamp-based locking mechanism.
+ *
+ * State Lifecycle:
+ * - RELEASED: The RocksDB instance is not being accessed by any thread
+ * - ACQUIRED: The RocksDB instance is currently being accessed by a thread
+ * - CLOSED: The RocksDB instance has been closed and can no longer be used
+ *
+ * Valid Transitions:
+ * - RELEASED -> ACQUIRED: When a thread acquires the RocksDB instance
+ * - ACQUIRED -> RELEASED: When a thread releases the RocksDB instance
+ * - RELEASED -> CLOSED: When the RocksDB instance is shut down
+ * - MAINTENANCE is an operation, not a state: it is allowed from both RELEASED and ACQUIRED
+ *   and leaves the current state unchanged
+ *
+ * Stamps:
+ * Each time a RocksDB instance is acquired, a unique stamp is generated. This stamp must be
+ * presented when performing operations on the RocksDB instance and when releasing it, ensuring
+ * that only the holder of the current stamp can operate on or release the instance.
+ */
+class RocksDBStateMachine(
+ stateStoreId: StateStoreId,
+ rocksDBConf: RocksDBConf) extends Logging {
+
+ private sealed trait STATE
+ private case object RELEASED extends STATE
+ private case object ACQUIRED extends STATE
+ private case object CLOSED extends STATE
+
+ private sealed abstract class OPERATION(name: String) {
+ override def toString: String = name
+ }
+ private case object LOAD extends OPERATION("load")
+ private case object RELEASE extends OPERATION("release")
+ private case object CLOSE extends OPERATION("close")
+ private case object MAINTENANCE extends OPERATION("maintenance")
+
+ private val stateMachineLock = new Object()
+ @GuardedBy("stateMachineLock")
+ private var state: STATE = RELEASED
+
+ // This is only maintained for logging purposes
+ @GuardedBy("stateMachineLock")
+ private var acquiredThreadInfo: AcquiredThreadInfo = _
+
+ private val RELEASED_STATE_MACHINE_STAMP: Long = -1L
+
+ /**
+ * Map defining all valid state transitions in the state machine.
+ * Key: (currentState, operation) -> Value: nextState
+ *
+ * Valid transitions:
+ * - (RELEASED, LOAD) -> ACQUIRED: Acquire exclusive access to the RocksDB instance
+ * - (ACQUIRED, RELEASE) -> RELEASED: Release exclusive access
+ * - (RELEASED, CLOSE) -> CLOSED: Permanently close the RocksDB instance
+ * - (CLOSED, CLOSE) -> CLOSED: Close is idempotent
+ * - (RELEASED, MAINTENANCE) -> RELEASED: Maintenance on released RocksDB instance
+ * - (ACQUIRED, MAINTENANCE) -> ACQUIRED: Maintenance on acquired RocksDB instance
+ */
+ private val allowedStateTransitions: Map[(STATE, OPERATION), STATE] = Map(
+ (RELEASED, LOAD) -> ACQUIRED,
+ (ACQUIRED, RELEASE) -> RELEASED,
+ (RELEASED, CLOSE) -> CLOSED,
+ (CLOSED, CLOSE) -> CLOSED, // Idempotent close operation
+ (RELEASED, MAINTENANCE) -> RELEASED,
+ (ACQUIRED, MAINTENANCE) -> ACQUIRED
+ )
+
+ /**
+ * Returns information about the thread that currently has the RocksDB instance acquired.
+ * This method is exposed for testing purposes only.
+ *
+ * @return Some(AcquiredThreadInfo) if a thread currently has the RocksDB instance acquired,
+ * None if the RocksDB instance is in RELEASED state
+ */
+ private[spark] def getAcquiredThreadInfo: Option[AcquiredThreadInfo] =
+ stateMachineLock.synchronized {
+ Option(acquiredThreadInfo).map(_.copy())
+ }
+
+ // Can be read without holding any locks, but should only be updated when
+ // stateMachineLock is held.
+ private[state] val currentValidStamp = new AtomicLong(RELEASED_STATE_MACHINE_STAMP)
+ @GuardedBy("stateMachineLock")
+ private var lastValidStamp: Long = 0L
+
+ /**
+ * This method is marked "WithLock" because it MUST only be called when the caller
+ * already holds the stateMachineLock. Calling this method without holding the lock
+ * will result in race conditions and data corruption.
+ *
+ * @return A new unique stamp value
+ */
+ @GuardedBy("stateMachineLock")
+ private def incAndGetStampWithLock: Long = {
+ assert(Thread.holdsLock(stateMachineLock), "Instance lock must be held")
+ lastValidStamp += 1
+ currentValidStamp.set(lastValidStamp)
+ logInfo(log"New stamp: ${MDC(LogKeys.STAMP, currentValidStamp.get())} issued for " +
+ log"${MDC(LogKeys.STATE_STORE_ID, stateStoreId)}")
+ lastValidStamp
+ }
+
+ /**
+ * This method is marked "WithLock" because it MUST only be called when the caller
+ * already holds the stateMachineLock. The method uses stateMachineLock.wait(), which
+ * requires the calling thread to own the monitor. Calling this without holding the
+ * lock will throw IllegalMonitorStateException.
+ *
+ * @param operation The operation being attempted (used for error reporting)
+ * @throws QueryExecutionErrors.unreleasedThreadError if timeout occurs
+ */
+ @GuardedBy("stateMachineLock")
+ private def awaitNotAcquiredWithLock(operation: OPERATION): Unit = {
+ assert(Thread.holdsLock(stateMachineLock), "Instance lock must be held")
+ val waitStartTime = System.nanoTime()
+ def timeWaitedMs = {
+ val elapsedNanos = System.nanoTime() - waitStartTime
+ // Convert from nanoseconds to milliseconds
+ TimeUnit.MILLISECONDS.convert(elapsedNanos, TimeUnit.NANOSECONDS)
+ }
+ while (state == ACQUIRED && timeWaitedMs < rocksDBConf.lockAcquireTimeoutMs) {
+ stateMachineLock.wait(10)
+      // log roughly every 30 seconds while waiting
+      if (timeWaitedMs >= 30 * 1000 && timeWaitedMs % (30 * 1000) < 10) {
+ logInfo(log"Waiting to acquire lock for ${MDC(LogKeys.STATE_STORE_ID, stateStoreId)}")
+ }
+ }
+ if (state == ACQUIRED) {
+ val newAcquiredThreadInfo = AcquiredThreadInfo()
+ val stackTraceOutput = acquiredThreadInfo.threadRef.get.get.getStackTrace.mkString("\n")
+ val loggingId = s"StateStoreId(opId=${stateStoreId.operatorId}," +
+ s"partId=${stateStoreId.partitionId},name=${stateStoreId.storeName})"
+ throw QueryExecutionErrors.unreleasedThreadError(loggingId, operation.toString,
+ newAcquiredThreadInfo.toString(), acquiredThreadInfo.toString(), timeWaitedMs,
+ stackTraceOutput)
+ }
+ }
+
+ /**
+ * Validates a state operation and updates the internal state if the transition is legal.
+ *
+ * This method is the core of the state machine that ensures thread-safe access to RocksDB
+ * instances. It uses a map-based approach to define valid state transitions,
+ * making the state machine logic cleaner and more maintainable.
+ *
+ * Thread Safety Requirements:
+ * - Caller MUST hold the stateMachineLock before calling this method
+ * - This is enforced by the synchronized blocks in all public methods
+ *
+ * Side Effects:
+ * - Updates the internal state variable
+ * - Sets acquiredThreadInfo when transitioning to ACQUIRED state
+ * - Logs state transitions for debugging
+ *
+ * @param operation The requested state operation (LOAD, RELEASE, CLOSE, or MAINTENANCE)
+ * @return A tuple of (oldState, newState) representing the state before and after operation
+ * @throws StateStoreInvalidStateMachineTransition if the requested operation is not allowed
+ * from the current state
+ */
+ @GuardedBy("stateMachineLock")
+ private def validateAndTransitionState(operation: OPERATION): (STATE, STATE) = {
+ assert(Thread.holdsLock(stateMachineLock), "Instance lock must be held")
+ val oldState = state
+ val newState = allowedStateTransitions.get((oldState, operation)) match {
+ case Some(nextState) => nextState
+ case None =>
+ // Determine expected state for better error message
+ val expectedState = operation match {
+ case LOAD => "ACQUIRED"
+ case RELEASE => "RELEASED"
+ case CLOSE => "CLOSED"
+ case MAINTENANCE => oldState.toString
+ }
+ throw StateStoreErrors.invalidStateMachineTransition(
+ oldState.toString, expectedState, operation.toString, stateStoreId)
+ }
+ state = newState
+ if (newState == ACQUIRED) {
+ acquiredThreadInfo = AcquiredThreadInfo()
+ }
+ logInfo(log"Transitioned state from ${MDC(LogKeys.STATE_STORE_STATE, oldState)} " +
+ log"to ${MDC(LogKeys.STATE_STORE_STATE, newState)} " +
+ log"with operation ${MDC(LogKeys.OPERATION, operation.toString)} " +
+ log"for StateStoreId ${MDC(LogKeys.STATE_STORE_ID, stateStoreId)}")
+ (oldState, newState)
+ }
+
+ /**
+ * Verifies that the provided stamp matches the current valid stamp.
+ * This ensures that operations are performed by the task that acquired the RocksDB instance.
+ *
+ * @param stamp The stamp to verify against the current valid stamp
+ * @throws StateStoreInvalidStamp if the stamp does not match the current valid stamp
+ */
+ def verifyStamp(stamp: Long): Unit = {
+ val currentStamp = currentValidStamp.get()
+ if (stamp != currentStamp) {
+ throw StateStoreErrors.invalidStamp(stamp, currentStamp)
+ }
+ }
+
+ /**
+ * Releases the RocksDB instance, transitioning it from ACQUIRED to RELEASED state.
+ * This can only be called by the stamp owner that acquired the RocksDB instance.
+ *
+ * @param stamp The stamp that was returned when the RocksDB instance was acquired
+ * @param throwEx Whether to throw an exception if the stamp is invalid (default: true)
+ * @return true if the RocksDB instance was successfully released, false if stamp was invalid
+ * and throwEx=false
+ * @throws StateStoreInvalidStamp if stamp is invalid and throwEx=true
+ * @throws StateStoreInvalidStateMachineTransition if the current state doesn't allow release
+ */
+  def releaseStamp(stamp: Long, throwEx: Boolean = true): Boolean = stateMachineLock.synchronized {
+    if (currentValidStamp.compareAndSet(stamp, RELEASED_STATE_MACHINE_STAMP)) {
+      validateAndTransitionState(RELEASE)
+      true
+    } else if (throwEx) {
+      val actualStamp = currentValidStamp.get()
+      throw StateStoreErrors.invalidStamp(stamp, actualStamp)
+    } else {
+      false
+    }
+  }
+
+ /**
+ * Acquires the RocksDB instance for exclusive use by the calling task.
+ * Transitions the state from RELEASED to ACQUIRED.
+ *
+ * This method will block if another task currently has a stamp for the RocksDB instance,
+ * waiting up to the configured timeout before throwing an exception.
+ *
+ * @return A unique stamp that must be used for subsequent operations and release
+ * @throws StateStoreInvalidStateMachineTransition if the RocksDB instance is in CLOSED state
+ * @throws QueryExecutionErrors.unreleasedThreadError if timeout occurs waiting for another thread
+ */
+ def acquireStamp(): Long = stateMachineLock.synchronized {
+ awaitNotAcquiredWithLock(LOAD)
+ validateAndTransitionState(LOAD)
+ incAndGetStampWithLock
+ }
+
+ /**
+   * Verifies that the state machine is in a state that allows maintenance to be performed.
+ * This operation is allowed in both RELEASED and ACQUIRED states.
+ *
+ * @throws StateStoreInvalidStateMachineTransition if the RocksDB instance is in CLOSED state
+ */
+ def verifyForMaintenance(): Unit = stateMachineLock.synchronized {
+ validateAndTransitionState(MAINTENANCE)
+ }
+
+ /**
+ * Closes the RocksDB instance permanently, transitioning it to CLOSED state.
+ * Once closed, the RocksDB instance cannot be used again and all future operations will fail.
+ *
+ * This method will block if another task currently has a stamp for the RocksDB instance,
+ * waiting up to the configured timeout before throwing an exception.
+ *
+   * @return true if the underlying RocksDB instance needs to be closed by the caller,
+   *         false if the state machine was already CLOSED (close is idempotent)
+ * @throws QueryExecutionErrors.unreleasedThreadError if timeout occurs waiting for another thread
+ */
+ def close(): Boolean = stateMachineLock.synchronized {
+ // return boolean as to whether we need to close or not
+ if (state == CLOSED) {
+ false
+ } else {
+ logInfo(log"Trying to close store ${MDC(LogKeys.STATE_STORE_ID, stateStoreId)}")
+ awaitNotAcquiredWithLock(CLOSE)
+      logInfo(log"Finished waiting for the store to be released," +
+        log" transitioning to close store ${MDC(LogKeys.STATE_STORE_ID, stateStoreId)}")
+ validateAndTransitionState(CLOSE)
+ true
+ }
+ }
+}
+
+case class AcquiredThreadInfo(
+ threadRef: WeakReference[Thread] = new WeakReference[Thread](Thread.currentThread()),
+ tc: TaskContext = TaskContext.get()) {
+ override def toString(): String = {
+ val taskStr = if (tc != null) {
+ val taskDetails =
+ s"partition ${tc.partitionId()}.${tc.attemptNumber()} in stage " +
+ s"${tc.stageId()}.${tc.stageAttemptNumber()}, TID ${tc.taskAttemptId()}"
+ s", task: $taskDetails"
+ } else ""
+
+ s"[ThreadId: ${threadRef.get.map(_.getId)}$taskStr]"
+ }
+}
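For illustration, a minimal sketch of the acquire/verify/release cycle described above (not part of this patch; the `stateMachine` instance and the work performed while holding the stamp are assumed):

def withAcquiredInstance[T](stateMachine: RocksDBStateMachine)(doWork: => T): T = {
  // RELEASED -> ACQUIRED; blocks (up to lockAcquireTimeoutMs) if another thread holds a stamp
  val stamp = stateMachine.acquireStamp()
  try {
    // Every subsequent operation must present the stamp it was issued
    stateMachine.verifyStamp(stamp)
    doWork
  } finally {
    // ACQUIRED -> RELEASED; only the holder of the current stamp may release it
    stateMachine.releaseStamp(stamp, throwEx = false)
  }
}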
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateStoreProvider.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateStoreProvider.scala
index 6efdf8d67137b..4230ea3a21662 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateStoreProvider.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/RocksDBStateStoreProvider.scala
@@ -26,13 +26,13 @@ import scala.util.control.NonFatal
import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.Path
-import org.apache.spark.{SparkConf, SparkEnv}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.{SparkConf, SparkEnv, TaskContext}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.internal.LogKeys._
import org.apache.spark.io.CompressionCodec
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
import org.apache.spark.sql.execution.streaming.state.StateStoreEncoding.Avro
import org.apache.spark.sql.types.StructType
import org.apache.spark.unsafe.Platform
@@ -43,20 +43,149 @@ private[sql] class RocksDBStateStoreProvider
with SupportsFineGrainedReplay {
import RocksDBStateStoreProvider._
- class RocksDBStateStore(lastVersion: Long) extends StateStore {
+ class RocksDBStateStore(
+ lastVersion: Long,
+ private[RocksDBStateStoreProvider] val stamp: Long,
+ private[RocksDBStateStoreProvider] var readOnly: Boolean) extends StateStore {
+
+ private sealed trait OPERATION
+ private case object UPDATE extends OPERATION
+ private case object ABORT extends OPERATION
+ private case object RELEASE extends OPERATION
+ private case object COMMIT extends OPERATION
+ private case object METRICS extends OPERATION
+
/** Trait and classes representing the internal state of the store */
trait STATE
case object UPDATING extends STATE
case object COMMITTED extends STATE
case object ABORTED extends STATE
+ case object RELEASED extends STATE
@volatile private var state: STATE = UPDATING
@volatile private var isValidated = false
+ /**
+ * Map defining all valid state transitions for the RocksDB state store.
+ * Key: (currentState, operation) -> Value: nextState
+ *
+ * Valid transitions:
+ * - (UPDATING, UPDATE) -> UPDATING: Continue updating
+ * - (UPDATING, ABORT) -> ABORTED: Abort during update
+ * - (UPDATING, RELEASE) -> RELEASED: Release during update
+ * - (UPDATING, COMMIT) -> COMMITTED: Direct commit
+ * - (COMMITTED, METRICS) -> COMMITTED: Allow metrics after commit
+ * - (ABORTED, ABORT) -> ABORTED: Abort is idempotent
+ * - (ABORTED, METRICS) -> ABORTED: Allow metrics after abort
+ * - (RELEASED, RELEASE) -> RELEASED: Release is idempotent
+ * - (RELEASED, METRICS) -> RELEASED: Allow metrics after release
+ */
+ private val allowedStateTransitions: Map[(STATE, OPERATION), STATE] = Map(
+ // From UPDATING state
+ (UPDATING, UPDATE) -> UPDATING,
+ (UPDATING, ABORT) -> ABORTED,
+ (UPDATING, RELEASE) -> RELEASED,
+ (UPDATING, COMMIT) -> COMMITTED,
+ // From COMMITTED state
+ (COMMITTED, METRICS) -> COMMITTED,
+ // From ABORTED state
+ (ABORTED, ABORT) -> ABORTED, // Idempotent
+ (ABORTED, METRICS) -> ABORTED,
+ // From RELEASED state
+ (RELEASED, RELEASE) -> RELEASED, // Idempotent
+ (RELEASED, METRICS) -> RELEASED
+ )
+
override def id: StateStoreId = RocksDBStateStoreProvider.this.stateStoreId
override def version: Long = lastVersion
+ /**
+     * Validates that the store is in one of the expected states and throws an exception
+     * otherwise. Returns the current state.
+ *
+ * @param possibleStates Expected possible states
+ * @return current state of StateStore
+ */
+ private def validateState(possibleStates: STATE*): STATE = {
+ if (!possibleStates.contains(state)) {
+ throw StateStoreErrors.stateStoreOperationOutOfOrder(
+ s"Expected possible states ${possibleStates.mkString("(", ", ", ")")} but found $state")
+ }
+ state
+ }
+
+ /**
+     * Throws an error if the requested transition is illegal.
+     * MUST be called from every StateStore method.
+     *
+     * @param operation The operation whose state transition should be validated.
+ */
+ private def validateAndTransitionState(operation: OPERATION): Unit = {
+ val oldState = state
+
+ // Operations requiring stamp verification
+ val needsStampVerification = operation match {
+ case ABORT if state == ABORTED => false // ABORT is idempotent
+ case RELEASE if state == RELEASED => false // RELEASE is idempotent
+ case UPDATE | ABORT | RELEASE | COMMIT => true
+ case METRICS => false
+ }
+
+ if (needsStampVerification) {
+ stateMachine.verifyStamp(stamp)
+ }
+
+ val newState = allowedStateTransitions.get((oldState, operation)) match {
+ case Some(nextState) => nextState
+ case None =>
+ val errorMsg = operation match {
+ case UPDATE => s"Cannot update after ${oldState.toString}"
+ case ABORT => s"Cannot abort after ${oldState.toString}"
+ case RELEASE => s"Cannot release after ${oldState.toString}"
+ case COMMIT => s"Cannot commit after ${oldState.toString}"
+ case METRICS => s"Cannot get metrics in ${oldState} state"
+ }
+ throw StateStoreErrors.stateStoreOperationOutOfOrder(errorMsg)
+ }
+
+      // Special handling for COMMIT and RELEASE operations - release the stamp
+ if (operation == COMMIT || operation == RELEASE) {
+ stateMachine.releaseStamp(stamp)
+ }
+
+ if (operation != UPDATE) {
+ logInfo(log"Transitioned state from ${MDC(LogKeys.STATE_STORE_STATE, oldState)} " +
+ log"to ${MDC(LogKeys.STATE_STORE_STATE, newState)} " +
+ log"for StateStoreId ${MDC(LogKeys.STATE_STORE_ID, stateStoreId)} " +
+ log"with transition ${MDC(LogKeys.OPERATION, operation.toString)}")
+ }
+ state = newState
+ }
+
+ Option(TaskContext.get()).foreach { ctxt =>
+ ctxt.addTaskCompletionListener[Unit](ctx => {
+ try {
+ if (state == UPDATING) {
+ if (readOnly) {
+ release()
+ } else {
+              abort() // An UPDATING store at task completion indicates an error, so abort
+ }
+ }
+ } catch {
+ case NonFatal(e) =>
+ logWarning("Failed to abort or release state store", e)
+ } finally {
+ stateMachine.releaseStamp(stamp, throwEx = false)
+ }
+ })
+ // Abort the async commit stores only when the task has failed and store is not committed.
+ ctxt.addTaskFailureListener((_, _) => {
+ if (!hasCommitted) abort()
+ })
+ }
+
override def createColFamilyIfAbsent(
colFamilyName: String,
keySchema: StructType,
@@ -64,6 +193,7 @@ private[sql] class RocksDBStateStoreProvider
keyStateEncoderSpec: KeyStateEncoderSpec,
useMultipleValuesPerKey: Boolean = false,
isInternal: Boolean = false): Unit = {
+ validateAndTransitionState(UPDATE)
verifyColFamilyCreationOrDeletion("create_col_family", colFamilyName, isInternal)
val cfId = rocksDB.createColFamilyIfAbsent(colFamilyName, isInternal)
val dataEncoderCacheKey = StateRowEncoderCacheKey(
@@ -105,6 +235,7 @@ private[sql] class RocksDBStateStoreProvider
}
override def get(key: UnsafeRow, colFamilyName: String): UnsafeRow = {
+ validateAndTransitionState(UPDATE)
verify(key != null, "Key cannot be null")
verifyColFamilyOperations("get", colFamilyName)
@@ -131,6 +262,7 @@ private[sql] class RocksDBStateStoreProvider
* values per key.
*/
override def valuesIterator(key: UnsafeRow, colFamilyName: String): Iterator[UnsafeRow] = {
+ validateAndTransitionState(UPDATE)
verify(key != null, "Key cannot be null")
verifyColFamilyOperations("valuesIterator", colFamilyName)
@@ -147,6 +279,7 @@ private[sql] class RocksDBStateStoreProvider
override def merge(key: UnsafeRow, value: UnsafeRow,
colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): Unit = {
+ validateAndTransitionState(UPDATE)
verify(state == UPDATING, "Cannot merge after already committed or aborted")
verifyColFamilyOperations("merge", colFamilyName)
@@ -162,6 +295,7 @@ private[sql] class RocksDBStateStoreProvider
}
override def put(key: UnsafeRow, value: UnsafeRow, colFamilyName: String): Unit = {
+ validateAndTransitionState(UPDATE)
verify(state == UPDATING, "Cannot put after already committed or aborted")
verify(key != null, "Key cannot be null")
require(value != null, "Cannot put a null value")
@@ -172,6 +306,7 @@ private[sql] class RocksDBStateStoreProvider
}
override def remove(key: UnsafeRow, colFamilyName: String): Unit = {
+ validateAndTransitionState(UPDATE)
verify(state == UPDATING, "Cannot remove after already committed or aborted")
verify(key != null, "Key cannot be null")
verifyColFamilyOperations("remove", colFamilyName)
@@ -180,16 +315,18 @@ private[sql] class RocksDBStateStoreProvider
rocksDB.remove(kvEncoder._1.encodeKey(key), colFamilyName)
}
- override def iterator(colFamilyName: String): Iterator[UnsafeRowPair] = {
+ override def iterator(colFamilyName: String): StateStoreIterator[UnsafeRowPair] = {
+ validateAndTransitionState(UPDATE)
// Note this verify function only verify on the colFamilyName being valid,
// we are actually doing prefix when useColumnFamilies,
// but pass "iterator" to throw correct error message
verifyColFamilyOperations("iterator", colFamilyName)
val kvEncoder = keyValueEncoderMap.get(colFamilyName)
val rowPair = new UnsafeRowPair()
-
if (useColumnFamilies) {
- rocksDB.iterator(colFamilyName).map { kv =>
+ val rocksDbIter = rocksDB.iterator(colFamilyName)
+
+ val iter = rocksDbIter.map { kv =>
rowPair.withRows(kvEncoder._1.decodeKey(kv.key),
kvEncoder._2.decodeValue(kv.value))
if (!isValidated && rowPair.value != null && !useColumnFamilies) {
@@ -199,8 +336,12 @@ private[sql] class RocksDBStateStoreProvider
}
rowPair
}
+
+ new StateStoreIterator(iter, rocksDbIter.closeIfNeeded)
} else {
- rocksDB.iterator().map { kv =>
+ val rocksDbIter = rocksDB.iterator()
+
+ val iter = rocksDbIter.map { kv =>
rowPair.withRows(kvEncoder._1.decodeKey(kv.key),
kvEncoder._2.decodeValue(kv.value))
if (!isValidated && rowPair.value != null && !useColumnFamilies) {
@@ -210,11 +351,15 @@ private[sql] class RocksDBStateStoreProvider
}
rowPair
}
+
+ new StateStoreIterator(iter, rocksDbIter.closeIfNeeded)
}
}
- override def prefixScan(prefixKey: UnsafeRow, colFamilyName: String):
- Iterator[UnsafeRowPair] = {
+ override def prefixScan(
+ prefixKey: UnsafeRow,
+ colFamilyName: String): StateStoreIterator[UnsafeRowPair] = {
+ validateAndTransitionState(UPDATE)
verifyColFamilyOperations("prefixScan", colFamilyName)
val kvEncoder = keyValueEncoderMap.get(colFamilyName)
@@ -223,22 +368,36 @@ private[sql] class RocksDBStateStoreProvider
val rowPair = new UnsafeRowPair()
val prefix = kvEncoder._1.encodePrefixKey(prefixKey)
- rocksDB.prefixScan(prefix, colFamilyName).map { kv =>
+
+ val rocksDbIter = rocksDB.prefixScan(prefix, colFamilyName)
+ val iter = rocksDbIter.map { kv =>
rowPair.withRows(kvEncoder._1.decodeKey(kv.key),
kvEncoder._2.decodeValue(kv.value))
rowPair
}
+
+ new StateStoreIterator(iter, rocksDbIter.closeIfNeeded)
}
var checkpointInfo: Option[StateStoreCheckpointInfo] = None
+ private var storedMetrics: Option[RocksDBMetrics] = None
+
override def commit(): Long = synchronized {
+ validateState(UPDATING)
try {
- verify(state == UPDATING, "Cannot commit after already committed or aborted")
+ stateMachine.verifyStamp(stamp)
val (newVersion, newCheckpointInfo) = rocksDB.commit()
checkpointInfo = Some(newCheckpointInfo)
- state = COMMITTED
+ storedMetrics = rocksDB.metricsOpt
+ validateAndTransitionState(COMMIT)
logInfo(log"Committed ${MDC(VERSION_NUM, newVersion)} " +
log"for ${MDC(STATE_STORE_ID, id)}")
+
+ // Report the commit to StateStoreCoordinator for tracking
+ if (storeConf.commitValidationEnabled) {
+ StateStore.reportCommitToCoordinator(newVersion, stateStoreId, hadoopConf)
+ }
+
newVersion
} catch {
case e: Throwable =>
@@ -246,16 +405,38 @@ private[sql] class RocksDBStateStoreProvider
}
}
+ override def release(): Unit = {
+ assert(readOnly, "Release can only be called on a read-only store")
+ if (state != RELEASED) {
+ logInfo(log"Releasing ${MDC(VERSION_NUM, version + 1)} " +
+ log"for ${MDC(STATE_STORE_ID, id)}")
+ rocksDB.release()
+ validateAndTransitionState(RELEASE)
+ } else {
+        // Already released, so just log at DEBUG level
+ logDebug(log"State store already released")
+ }
+ }
+
override def abort(): Unit = {
- verify(state == UPDATING || state == ABORTED, "Cannot abort after already committed")
- logInfo(log"Aborting ${MDC(VERSION_NUM, version + 1)} " +
- log"for ${MDC(STATE_STORE_ID, id)}")
- rocksDB.rollback()
- state = ABORTED
+ if (validateState(UPDATING, ABORTED) != ABORTED) {
+ try {
+ validateAndTransitionState(ABORT)
+ logInfo(log"Aborting ${MDC(VERSION_NUM, version + 1)} " +
+ log"for ${MDC(STATE_STORE_ID, id)}")
+ rocksDB.rollback()
+ } finally {
+ stateMachine.releaseStamp(stamp)
+ }
+ } else {
+ logInfo(log"Skipping abort for ${MDC(VERSION_NUM, version + 1)} " +
+ log"for ${MDC(STATE_STORE_ID, id)} as we already aborted")
+ }
}
override def metrics: StateStoreMetrics = {
- val rocksDBMetricsOpt = rocksDB.metricsOpt
+ validateAndTransitionState(METRICS)
+ val rocksDBMetricsOpt = storedMetrics
if (rocksDBMetricsOpt.isDefined) {
val rocksDBMetrics = rocksDBMetricsOpt.get
@@ -263,6 +444,9 @@ private[sql] class RocksDBStateStoreProvider
def commitLatencyMs(typ: String): Long =
rocksDBMetrics.lastCommitLatencyMs.getOrElse(typ, 0L)
+ def loadMetrics(typ: String): Long =
+ rocksDBMetrics.loadMetrics.getOrElse(typ, 0L)
+
def nativeOpsLatencyMillis(typ: String): Long = {
rocksDBMetrics.nativeOpsMetrics.get(typ).map(_ * 1000).getOrElse(0)
}
@@ -298,6 +482,13 @@ private[sql] class RocksDBStateStoreProvider
CUSTOM_METRIC_COMMIT_COMPACT_TIME -> commitLatencyMs("compact"),
CUSTOM_METRIC_CHECKPOINT_TIME -> commitLatencyMs("checkpoint"),
CUSTOM_METRIC_FILESYNC_TIME -> commitLatencyMs("fileSync"),
+ CUSTOM_METRIC_CHANGE_LOG_WRITER_COMMIT_TIME -> commitLatencyMs("changeLogWriterCommit"),
+ CUSTOM_METRIC_SAVE_ZIP_FILES_TIME -> commitLatencyMs("saveZipFiles"),
+
+ CUSTOM_METRIC_LOAD_FROM_SNAPSHOT_TIME -> loadMetrics("loadFromSnapshot"),
+ CUSTOM_METRIC_LOAD_TIME -> loadMetrics("load"),
+ CUSTOM_METRIC_REPLAY_CHANGE_LOG -> loadMetrics("replayChangelog"),
+ CUSTOM_METRIC_NUM_REPLAY_CHANGE_LOG_FILES -> loadMetrics("numReplayChangeLogFiles"),
CUSTOM_METRIC_BYTES_COPIED -> rocksDBMetrics.bytesCopied,
CUSTOM_METRIC_FILES_COPIED -> rocksDBMetrics.filesCopied,
CUSTOM_METRIC_FILES_REUSED -> rocksDBMetrics.filesReused,
@@ -337,6 +528,7 @@ private[sql] class RocksDBStateStoreProvider
}
override def getStateStoreCheckpointInfo(): StateStoreCheckpointInfo = {
+ validateAndTransitionState(METRICS)
checkpointInfo match {
case Some(info) => info
case None => throw StateStoreErrors.stateStoreOperationOutOfOrder(
@@ -347,8 +539,7 @@ private[sql] class RocksDBStateStoreProvider
override def hasCommitted: Boolean = state == COMMITTED
override def toString: String = {
- s"RocksDBStateStore[id=(op=${id.operatorId},part=${id.partitionId})," +
- s"dir=${id.storeCheckpointLocation()}]"
+ s"RocksDBStateStore[stateStoreId=$stateStoreId_, version=$version]"
}
/** Return the [[RocksDB]] instance in this store. This is exposed mainly for testing. */
@@ -393,6 +584,10 @@ private[sql] class RocksDBStateStoreProvider
this.rocksDBEventForwarder =
Some(RocksDBEventForwarder(StateStoreProvider.getRunId(hadoopConf), stateStoreId))
+ // Initialize StateStoreProviderId for memory tracking
+ val queryRunId = UUID.fromString(StateStoreProvider.getRunId(hadoopConf))
+ this.stateStoreProviderId = StateStoreProviderId(stateStoreId, queryRunId)
+
if (useMultipleValuesPerKey) {
require(useColumnFamilies, "Multiple values per key support requires column families to be" +
" enabled in RocksDBStateStore.")
@@ -446,48 +641,120 @@ private[sql] class RocksDBStateStoreProvider
override def stateStoreId: StateStoreId = stateStoreId_
- override def getStore(version: Long, uniqueId: Option[String] = None): StateStore = {
+ private lazy val stateMachine: RocksDBStateMachine =
+ new RocksDBStateMachine(stateStoreId, RocksDBConf(storeConf))
+
+ override protected def logName: String = s"${super.logName} ${stateStoreProviderId}"
+
+ /**
+ * Creates and returns a state store with the specified parameters.
+ *
+ * @param version The version of the state store to load
+ * @param uniqueId Optional unique identifier for checkpoint
+ * @param readOnly Whether to open the store in read-only mode
+ * @param existingStore Optional existing store to reuse instead of creating a new one
+ * @return The loaded state store
+ */
+ private def loadStateStore(
+ version: Long,
+ uniqueId: Option[String] = None,
+ readOnly: Boolean,
+ existingStore: Option[RocksDBStateStore] = None): StateStore = {
+ var acquiredStamp: Option[Long] = None
+ var storeLoaded = false
try {
if (version < 0) {
throw QueryExecutionErrors.unexpectedStateStoreVersion(version)
}
- rocksDB.load(
- version,
- stateStoreCkptId = if (storeConf.enableStateStoreCheckpointIds) uniqueId else None)
- new RocksDBStateStore(version)
- }
- catch {
- case e: OutOfMemoryError =>
- throw QueryExecutionErrors.notEnoughMemoryToLoadStore(
- stateStoreId.toString,
- "ROCKSDB_STORE_PROVIDER",
- e)
- case e: Throwable => throw StateStoreErrors.cannotLoadStore(e)
- }
- }
- override def getReadStore(version: Long, uniqueId: Option[String] = None): StateStore = {
- try {
- if (version < 0) {
- throw QueryExecutionErrors.unexpectedStateStoreVersion(version)
+ // Early validation of the existing store type before loading RocksDB
+ existingStore.foreach { store =>
+ if (!store.readOnly) {
+ throw new IllegalArgumentException(
+ s"Existing store must be readOnly, but got a read-write store")
+ }
+ }
+
+ // if the existing store is None, then we need to acquire the stamp before
+ // loading RocksDB
+ val stamp = existingStore match {
+ case None =>
+ val s = stateMachine.acquireStamp()
+ acquiredStamp = Some(s)
+ Some(s)
+ case Some(store: RocksDBStateStore) =>
+ val s = store.stamp
+ stateMachine.verifyStamp(s)
+ Some(s)
}
+
rocksDB.load(
version,
stateStoreCkptId = if (storeConf.enableStateStoreCheckpointIds) uniqueId else None,
- readOnly = true)
- new RocksDBStateStore(version)
- }
- catch {
+ readOnly = readOnly)
+
+ // Create or reuse store instance
+ val store = existingStore match {
+ case Some(store: RocksDBStateStore) =>
+ // Mark store as being used for write operations
+ store.readOnly = readOnly
+ store
+ case None =>
+ // Create new store instance. The stamp should be defined
+ // in this case
+ new RocksDBStateStore(version, stamp.get, readOnly)
+ }
+ storeLoaded = true
+ store
+ } catch {
case e: OutOfMemoryError =>
throw QueryExecutionErrors.notEnoughMemoryToLoadStore(
stateStoreId.toString,
"ROCKSDB_STORE_PROVIDER",
e)
+ case e: StateStoreInvalidStateMachineTransition =>
+ throw e
case e: Throwable => throw StateStoreErrors.cannotLoadStore(e)
+ } finally {
+ // If we acquired a stamp but failed to load the store, release it.
+ // Note: We cannot rely on the task completion listener to clean up the stamp in this case
+ // because the listener is only registered in the RocksDBStateStore constructor. If the
+ // store fails to load (e.g., rocksDB.load() throws an exception), the RocksDBStateStore
+ // instance is never created, so no completion listener exists to release the stamp.
+ // This finally block ensures proper cleanup even when store creation fails early.
+      if (!storeLoaded) {
+ acquiredStamp.foreach(stamp => stateMachine.releaseStamp(stamp, throwEx = false))
+ }
}
}
+ override def getStore(
+ version: Long, uniqueId: Option[String] = None): StateStore = {
+ loadStateStore(version, uniqueId, readOnly = false)
+ }
+
+ override def upgradeReadStoreToWriteStore(
+ readStore: ReadStateStore,
+ version: Long,
+ uniqueId: Option[String] = None): StateStore = {
+ assert(version == readStore.version,
+ s"Can only upgrade readStore to writeStore with the same version," +
+ s" readStoreVersion: ${readStore.version}, writeStoreVersion: ${version}")
+ assert(this.stateStoreId == readStore.id, "Can only upgrade readStore to writeStore with" +
+ " the same stateStoreId")
+ assert(readStore.isInstanceOf[RocksDBStateStore], "Can only upgrade state store if it is a " +
+ "RocksDBStateStore")
+ loadStateStore(version, uniqueId, readOnly = false, existingStore =
+ Some(readStore.asInstanceOf[RocksDBStateStore]))
+ }
+
+ override def getReadStore(
+ version: Long, uniqueId: Option[String] = None): StateStore = {
+ loadStateStore(version, uniqueId, readOnly = true)
+ }
+
override def doMaintenance(): Unit = {
+ stateMachine.verifyForMaintenance()
try {
rocksDB.doMaintenance()
} catch {
@@ -500,7 +767,9 @@ private[sql] class RocksDBStateStoreProvider
}
override def close(): Unit = {
- rocksDB.close()
+ if (stateMachine.close()) {
+ rocksDB.close()
+ }
}
override def supportedCustomMetrics: Seq[StateStoreCustomMetric] = ALL_CUSTOM_METRICS
@@ -520,6 +789,7 @@ private[sql] class RocksDBStateStoreProvider
@volatile private var stateStoreEncoding: String = _
@volatile private var stateSchemaProvider: Option[StateSchemaProvider] = _
@volatile private var rocksDBEventForwarder: Option[RocksDBEventForwarder] = _
+ @volatile private var stateStoreProviderId: StateStoreProviderId = _
protected def createRocksDB(
dfsRootDir: String,
@@ -530,7 +800,8 @@ private[sql] class RocksDBStateStoreProvider
useColumnFamilies: Boolean,
enableStateStoreCheckpointIds: Boolean,
partitionId: Int = 0,
- eventForwarder: Option[RocksDBEventForwarder] = None): RocksDB = {
+ eventForwarder: Option[RocksDBEventForwarder] = None,
+ uniqueId: Option[String] = None): RocksDB = {
new RocksDB(
dfsRootDir,
conf,
@@ -540,18 +811,21 @@ private[sql] class RocksDBStateStoreProvider
useColumnFamilies,
enableStateStoreCheckpointIds,
partitionId,
- eventForwarder)
+ eventForwarder,
+ uniqueId)
}
private[sql] lazy val rocksDB = {
val dfsRootDir = stateStoreId.storeCheckpointLocation().toString
val storeIdStr = s"StateStoreId(opId=${stateStoreId.operatorId}," +
s"partId=${stateStoreId.partitionId},name=${stateStoreId.storeName})"
+ val loggingId = stateStoreProviderId.toString
val sparkConf = Option(SparkEnv.get).map(_.conf).getOrElse(new SparkConf)
val localRootDir = Utils.createTempDir(Utils.getLocalDir(sparkConf), storeIdStr)
- createRocksDB(dfsRootDir, RocksDBConf(storeConf), localRootDir, hadoopConf, storeIdStr,
+ createRocksDB(dfsRootDir, RocksDBConf(storeConf), localRootDir, hadoopConf, loggingId,
useColumnFamilies, storeConf.enableStateStoreCheckpointIds, stateStoreId.partitionId,
- rocksDBEventForwarder)
+ rocksDBEventForwarder,
+ Some(s"${stateStoreProviderId.toString}_${UUID.randomUUID().toString}"))
}
private val keyValueEncoderMap = new java.util.concurrent.ConcurrentHashMap[String,
@@ -572,7 +846,8 @@ private[sql] class RocksDBStateStoreProvider
* @param endVersion checkpoint version to end with
* @return [[StateStore]]
*/
- override def replayStateFromSnapshot(snapshotVersion: Long, endVersion: Long): StateStore = {
+ override def replayStateFromSnapshot(
+ snapshotVersion: Long, endVersion: Long, readOnly: Boolean): StateStore = {
try {
if (snapshotVersion < 1) {
throw QueryExecutionErrors.unexpectedStateStoreVersion(snapshotVersion)
@@ -580,8 +855,15 @@ private[sql] class RocksDBStateStoreProvider
if (endVersion < snapshotVersion) {
throw QueryExecutionErrors.unexpectedStateStoreVersion(endVersion)
}
- rocksDB.loadFromSnapshot(snapshotVersion, endVersion)
- new RocksDBStateStore(endVersion)
+ val stamp = stateMachine.acquireStamp()
+ try {
+ rocksDB.loadFromSnapshot(snapshotVersion, endVersion)
+ new RocksDBStateStore(endVersion, stamp, readOnly)
+ } catch {
+ case e: Throwable =>
+ stateMachine.releaseStamp(stamp)
+ throw e
+ }
}
catch {
case e: OutOfMemoryError =>
@@ -851,6 +1133,25 @@ object RocksDBStateStoreProvider {
"rocksdbFilesReused", "RocksDB: file manager - files reused")
val CUSTOM_METRIC_ZIP_FILE_BYTES_UNCOMPRESSED = StateStoreCustomSizeMetric(
"rocksdbZipFileBytesUncompressed", "RocksDB: file manager - uncompressed zip file bytes")
+ val CUSTOM_METRIC_CHANGE_LOG_WRITER_COMMIT_TIME = StateStoreCustomTimingMetric(
+ "rocksdbChangeLogWriterCommitLatencyMs",
+ "RocksDB: commit - changelog commit time")
+ val CUSTOM_METRIC_SAVE_ZIP_FILES_TIME = StateStoreCustomTimingMetric(
+ "rocksdbSaveZipFilesLatencyMs",
+ "RocksDB: commit - zip files sync to external storage time")
+
+ val CUSTOM_METRIC_LOAD_FROM_SNAPSHOT_TIME = StateStoreCustomTimingMetric(
+ "rocksdbLoadFromSnapshotLatencyMs",
+ "RocksDB: load from snapshot - time taken to load the store from snapshot")
+ val CUSTOM_METRIC_LOAD_TIME = StateStoreCustomTimingMetric(
+ "rocksdbLoadLatencyMs",
+ "RocksDB: load - time taken to load the store")
+ val CUSTOM_METRIC_REPLAY_CHANGE_LOG = StateStoreCustomTimingMetric(
+ "rocksdbReplayChangeLogLatencyMs",
+ "RocksDB: load - time taken to replay the change log")
+ val CUSTOM_METRIC_NUM_REPLAY_CHANGE_LOG_FILES = StateStoreCustomSizeMetric(
+ "rocksdbNumReplayChangelogFiles",
+ "RocksDB: load - number of change log files replayed")
val CUSTOM_METRIC_BLOCK_CACHE_MISS = StateStoreCustomSumMetric(
"rocksdbReadBlockCacheMissCount",
@@ -905,13 +1206,16 @@ object RocksDBStateStoreProvider {
CUSTOM_METRIC_FLUSH_TIME, CUSTOM_METRIC_COMMIT_COMPACT_TIME,
CUSTOM_METRIC_CHECKPOINT_TIME, CUSTOM_METRIC_FILESYNC_TIME,
CUSTOM_METRIC_BYTES_COPIED, CUSTOM_METRIC_FILES_COPIED, CUSTOM_METRIC_FILES_REUSED,
- CUSTOM_METRIC_ZIP_FILE_BYTES_UNCOMPRESSED, CUSTOM_METRIC_GET_COUNT, CUSTOM_METRIC_PUT_COUNT,
+ CUSTOM_METRIC_ZIP_FILE_BYTES_UNCOMPRESSED, CUSTOM_METRIC_CHANGE_LOG_WRITER_COMMIT_TIME,
+ CUSTOM_METRIC_SAVE_ZIP_FILES_TIME, CUSTOM_METRIC_GET_COUNT, CUSTOM_METRIC_PUT_COUNT,
CUSTOM_METRIC_BLOCK_CACHE_MISS, CUSTOM_METRIC_BLOCK_CACHE_HITS, CUSTOM_METRIC_BYTES_READ,
CUSTOM_METRIC_BYTES_WRITTEN, CUSTOM_METRIC_ITERATOR_BYTES_READ, CUSTOM_METRIC_STALL_TIME,
CUSTOM_METRIC_TOTAL_COMPACT_TIME, CUSTOM_METRIC_COMPACT_READ_BYTES,
CUSTOM_METRIC_COMPACT_WRITTEN_BYTES, CUSTOM_METRIC_FLUSH_WRITTEN_BYTES,
CUSTOM_METRIC_PINNED_BLOCKS_MEM_USAGE, CUSTOM_METRIC_NUM_INTERNAL_COL_FAMILIES_KEYS,
- CUSTOM_METRIC_NUM_EXTERNAL_COL_FAMILIES, CUSTOM_METRIC_NUM_INTERNAL_COL_FAMILIES)
+ CUSTOM_METRIC_NUM_EXTERNAL_COL_FAMILIES, CUSTOM_METRIC_NUM_INTERNAL_COL_FAMILIES,
+ CUSTOM_METRIC_LOAD_FROM_SNAPSHOT_TIME, CUSTOM_METRIC_LOAD_TIME, CUSTOM_METRIC_REPLAY_CHANGE_LOG,
+ CUSTOM_METRIC_NUM_REPLAY_CHANGE_LOG_FILES)
val CUSTOM_INSTANCE_METRIC_SNAPSHOT_LAST_UPLOADED = StateStoreSnapshotLastUploadInstanceMetric()
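For illustration, a rough sketch of how a caller might exercise the provider paths changed above (not part of this patch; `provider`, `version`, `key` and `newValue` are assumed to be in scope):

// Read-only path: release() on the success path instead of abort()
val readStore = provider.getReadStore(version)
val current = readStore.get(key, StateStore.DEFAULT_COL_FAMILY_NAME)
readStore.release()

// Read-then-write path: reuse the already-loaded read store instead of opening a second one
val readStore2 = provider.getReadStore(version)
val writeStore = provider.upgradeReadStoreToWriteStore(readStore2, version)
writeStore.put(key, newValue, StateStore.DEFAULT_COL_FAMILY_NAME)
writeStore.commit() // COMMIT also releases the underlying stamp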
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SchemaHelper.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SchemaHelper.scala
index d67eb40fde2c2..7da8c5a6bd3ca 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SchemaHelper.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/SchemaHelper.scala
@@ -25,7 +25,7 @@ import org.apache.hadoop.fs.{FSDataInputStream, FSDataOutputStream}
import org.json4s.DefaultFormats
import org.json4s.jackson.JsonMethods
-import org.apache.spark.sql.execution.streaming.MetadataVersionUtil
+import org.apache.spark.sql.execution.streaming.checkpointing.MetadataVersionUtil
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.Utils
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateSchemaCompatibilityChecker.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateSchemaCompatibilityChecker.scala
index 17a36e5210b94..ca18ce9067b36 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateSchemaCompatibilityChecker.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateSchemaCompatibilityChecker.scala
@@ -25,14 +25,15 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FSDataInputStream, Path}
import org.apache.spark.SparkUnsupportedOperationException
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.avro.{AvroDeserializer, AvroSerializer, SchemaConverters}
import org.apache.spark.sql.catalyst.util.UnsafeRowUtils
-import org.apache.spark.sql.execution.streaming.{CheckpointFileManager, StatefulOperatorStateInfo}
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorStateInfo
import org.apache.spark.sql.execution.streaming.state.SchemaHelper.{SchemaReader, SchemaWriter}
import org.apache.spark.sql.execution.streaming.state.StateSchemaCompatibilityChecker.SCHEMA_FORMAT_V3
-import org.apache.spark.sql.internal.SessionState
+import org.apache.spark.sql.internal.{SessionState, SQLConf}
import org.apache.spark.sql.types._
// Result returned after validating the schema of the state store for schema changes
@@ -88,7 +89,7 @@ class StateSchemaCompatibilityChecker(
// per query. This variable is the latest one
private val schemaFileLocation = if (oldSchemaFilePaths.isEmpty) {
val storeCpLocation = providerId.storeId.storeCheckpointLocation()
- schemaFile(storeCpLocation)
+ StateSchemaCompatibilityChecker.schemaFile(storeCpLocation)
} else {
oldSchemaFilePaths.last
}
@@ -97,7 +98,7 @@ class StateSchemaCompatibilityChecker(
fm.mkdirs(schemaFileLocation.getParent)
- private val conf = SparkSession.getActiveSession.get.sessionState.conf
+ private val conf = SparkSession.getActiveSession.map(_.sessionState.conf).getOrElse(new SQLConf())
// Read most recent schema file
def readSchemaFile(): List[StateStoreColFamilySchema] = {
@@ -302,9 +303,6 @@ class StateSchemaCompatibilityChecker(
newSchemaFileWritten
}
}
-
- private def schemaFile(storeCpLocation: Path): Path =
- new Path(new Path(storeCpLocation, "_metadata"), "schema")
}
object StateSchemaCompatibilityChecker extends Logging {
@@ -432,4 +430,7 @@ object StateSchemaCompatibilityChecker extends Logging {
StateSchemaValidationResult(evolvedSchema, schemaFileLocation)
}
+
+ def schemaFile(storeCpLocation: Path): Path =
+ new Path(new Path(storeCpLocation, "_metadata"), "schema")
}
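For illustration, with `schemaFile` now on the companion object it can be called without constructing a checker (not part of this patch; the checkpoint location is made up):

import org.apache.hadoop.fs.Path
val storeCpLocation = new Path("/tmp/query-checkpoint/state/0/0") // hypothetical location
val schemaPath = StateSchemaCompatibilityChecker.schemaFile(storeCpLocation)
// schemaPath == /tmp/query-checkpoint/state/0/0/_metadata/schema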
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStore.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStore.scala
index 9a85169ad451a..604a27866f62e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStore.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStore.scala
@@ -17,11 +17,13 @@
package org.apache.spark.sql.execution.streaming.state
+import java.io.Closeable
import java.util.UUID
-import java.util.concurrent.{ScheduledFuture, TimeUnit}
+import java.util.concurrent.{ConcurrentLinkedQueue, ScheduledFuture, TimeUnit}
import javax.annotation.concurrent.GuardedBy
import scala.collection.mutable
+import scala.collection.mutable.ArrayBuffer
import scala.util.control.NonFatal
import org.apache.hadoop.conf.Configuration
@@ -31,16 +33,38 @@ import org.json4s.JsonAST.JValue
import org.json4s.JsonDSL._
import org.json4s.jackson.JsonMethods.{compact, render}
-import org.apache.spark.{SparkContext, SparkEnv, SparkException}
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.{SparkContext, SparkEnv, SparkException, TaskContext}
+import org.apache.spark.internal.{Logging, LogKeys}
+import org.apache.spark.internal.LogKeys.{EXCEPTION, STATE_STORE_ID, VERSION_NUM}
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.catalyst.util.UnsafeRowUtils
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
-import org.apache.spark.sql.execution.streaming.{StatefulOperatorStateInfo, StreamExecution}
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorStateInfo
+import org.apache.spark.sql.execution.streaming.runtime.StreamExecution
+import org.apache.spark.sql.execution.streaming.state.MaintenanceTaskType._
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.{NextIterator, ThreadUtils, Utils}
+/**
+ * An iterator that provides additional functionality for state store use cases.
+ *
+ * `close()` frees the underlying iterator resources once the iterator is no longer needed.
+ *
+ * The caller MUST call `close()` on the iterator if it was not fully consumed and is no
+ * longer needed.
+ */
+class StateStoreIterator[A](
+ val iter: Iterator[A],
+ val onClose: () => Unit = () => {}) extends Iterator[A] with Closeable {
+ override def hasNext: Boolean = iter.hasNext
+
+ override def next(): A = iter.next()
+
+ override def close(): Unit = onClose()
+}
+
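For illustration, a small sketch of the contract above when an iterator is not fully drained (not part of this patch; `store` and `wantedKey` are assumed to be in scope):

val iter: StateStoreIterator[UnsafeRowPair] = store.iterator()
try {
  // Stop early once the row of interest is found; the iterator is not fully consumed
  iter.find(pair => pair.key == wantedKey)
} finally {
  // Must be closed explicitly because it was not drained
  iter.close()
}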
sealed trait StateStoreEncoding {
override def toString: String = this match {
case StateStoreEncoding.UnsafeRow => "unsaferow"
@@ -53,6 +77,14 @@ object StateStoreEncoding {
case object Avro extends StateStoreEncoding
}
+sealed trait MaintenanceTaskType
+
+object MaintenanceTaskType {
+ case object FromUnloadedProvidersQueue extends MaintenanceTaskType
+ case object FromTaskThread extends MaintenanceTaskType
+ case object FromLoadedProviders extends MaintenanceTaskType
+}
+
/**
* Base trait for a versioned key-value store which provides read operations. Each instance of a
* `ReadStateStore` represents a specific version of state data, and such instances are created
@@ -106,10 +138,11 @@ trait ReadStateStore {
*/
def prefixScan(
prefixKey: UnsafeRow,
- colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): Iterator[UnsafeRowPair]
+ colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): StateStoreIterator[UnsafeRowPair]
/** Return an iterator containing all the key-value pairs in the StateStore. */
- def iterator(colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): Iterator[UnsafeRowPair]
+ def iterator(
+ colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): StateStoreIterator[UnsafeRowPair]
/**
* Clean up the resource.
@@ -117,6 +150,22 @@ trait ReadStateStore {
* The method name is to respect backward compatibility on [[StateStore]].
*/
def abort(): Unit
+
+
+ /**
+ * Releases resources associated with this read-only state store.
+ *
+ * This method should be called when the store is no longer needed but has completed
+ * successfully (i.e., no errors occurred during reading). It performs any necessary
+ * cleanup operations without invalidating or rolling back the data that was read.
+ *
+ * In contrast to `abort()`, which is called on error paths to cancel operations,
+ * `release()` is the proper method to call in success scenarios when a read-only
+ * store is no longer needed.
+ *
+ * This method is idempotent and safe to call multiple times.
+ */
+ def release(): Unit
}
/**
@@ -188,6 +237,10 @@ trait StateStore extends ReadStateStore {
*/
override def abort(): Unit
+ override def release(): Unit = {
+ throw new UnsupportedOperationException("Should only call release() on ReadStateStore")
+ }
+
/**
* Return an iterator containing all the key-value pairs in the StateStore. Implementations must
* ensure that updates (puts, removes) can be made while iterating over this iterator.
@@ -196,8 +249,8 @@ trait StateStore extends ReadStateStore {
* performed after initialization of the iterator. Callers should perform all updates before
* calling this method if all updates should be visible in the returned iterator.
*/
- override def iterator(colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME):
- Iterator[UnsafeRowPair]
+ override def iterator(colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME)
+ : StateStoreIterator[UnsafeRowPair]
/** Current metrics of the state store */
def metrics: StateStoreMetrics
@@ -229,14 +282,16 @@ class WrappedReadStateStore(store: StateStore) extends ReadStateStore {
colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): UnsafeRow = store.get(key,
colFamilyName)
- override def iterator(colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME):
- Iterator[UnsafeRowPair] = store.iterator(colFamilyName)
+ override def iterator(colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME)
+ : StateStoreIterator[UnsafeRowPair] = store.iterator(colFamilyName)
override def abort(): Unit = store.abort()
+ override def release(): Unit = store.release()
+
override def prefixScan(prefixKey: UnsafeRow,
- colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME): Iterator[UnsafeRowPair] =
- store.prefixScan(prefixKey, colFamilyName)
+ colFamilyName: String = StateStore.DEFAULT_COL_FAMILY_NAME)
+ : StateStoreIterator[UnsafeRowPair] = store.prefixScan(prefixKey, colFamilyName)
override def valuesIterator(key: UnsafeRow, colFamilyName: String): Iterator[UnsafeRow] = {
store.valuesIterator(key, colFamilyName)
@@ -554,7 +609,11 @@ trait StateStoreProvider {
*/
def stateStoreId: StateStoreId
- /** Called when the provider instance is unloaded from the executor */
+  /**
+   * Called when the provider instance is unloaded from the executor.
+   * WARNING: IF THE PROVIDER IS TRACKED IN [[StateStore.loadedProviders]],
+   * CLOSE MUST ONLY BE CALLED FROM THE MAINTENANCE THREAD!
+   */
def close(): Unit
/**
@@ -575,6 +634,30 @@ trait StateStoreProvider {
def getReadStore(version: Long, uniqueId: Option[String] = None): ReadStateStore =
new WrappedReadStateStore(getStore(version, uniqueId))
+ /**
+ * Creates a writable store from an existing read-only store for the specified version.
+ *
+ * This method enables an important optimization pattern for stateful operations where
+ * the same state store needs to be accessed for both reading and writing within a task.
+ * Instead of opening two separate state store instances (which can cause contention issues),
+ * this method converts an existing read-only store to a writable store that can commit changes.
+ *
+ * This approach is particularly beneficial when:
+ * - A stateful operation needs to first read the existing state, then update it
+ * - The state store has locking mechanisms that prevent concurrent access
+ * - Multiple state store connections would cause unnecessary resource duplication
+ *
+ * @param readStore The existing read-only store instance to convert to a writable store
+ * @param version The version of the state store (must match the read store's version)
+ * @param uniqueId Optional unique identifier for checkpointing
+ * @return A writable StateStore instance that can be used to update and commit changes
+ */
+ def upgradeReadStoreToWriteStore(
+ readStore: ReadStateStore,
+ version: Long,
+ uniqueId: Option[String] = None): StateStore = getStore(version, uniqueId)
+
+
/** Optional method for providers to allow for background maintenance (e.g. compactions) */
def doMaintenance(): Unit = { }
@@ -664,7 +747,7 @@ object StateStoreProvider extends Logging {
}
/**
- * Get the runId from the provided hadoopConf. If it is not found, generate a random UUID.
+ * Get the runId from the provided hadoopConf. If it is not found, an error will be thrown.
*
* @param hadoopConf Hadoop configuration used by the StateStore to save state data
*/
@@ -717,7 +800,8 @@ trait SupportsFineGrainedReplay {
* @param snapshotVersion checkpoint version of the snapshot to start with
* @param endVersion checkpoint version to end with
*/
- def replayStateFromSnapshot(snapshotVersion: Long, endVersion: Long): StateStore
+ def replayStateFromSnapshot(
+ snapshotVersion: Long, endVersion: Long, readOnly: Boolean = false): StateStore
/**
* Return an instance of [[ReadStateStore]] representing state data of the given version.
@@ -730,7 +814,7 @@ trait SupportsFineGrainedReplay {
* @param endVersion checkpoint version to end with
*/
def replayReadStateFromSnapshot(snapshotVersion: Long, endVersion: Long): ReadStateStore = {
- new WrappedReadStateStore(replayStateFromSnapshot(snapshotVersion, endVersion))
+ new WrappedReadStateStore(replayStateFromSnapshot(snapshotVersion, endVersion, readOnly = true))
}
/**
@@ -759,7 +843,11 @@ trait SupportsFineGrainedReplay {
* Note that `queryRunId` is used uniquely identify a provider, so that the same provider
* instance is not reused across query restarts.
*/
-case class StateStoreProviderId(storeId: StateStoreId, queryRunId: UUID)
+case class StateStoreProviderId(storeId: StateStoreId, queryRunId: UUID) {
+ override def toString: String = {
+ s"StateStoreProviderId[ storeId=$storeId, queryRunId=$queryRunId ]"
+ }
+}
object StateStoreProviderId {
private[sql] def apply(
@@ -802,9 +890,7 @@ case class StateStoreId(
}
override def toString: String = {
- s"""StateStoreId[ checkpointRootLocation=$checkpointRootLocation, operatorId=$operatorId,
- | partitionId=$partitionId, storeName=$storeName ]
- |""".stripMargin.replaceAll("\n", "")
+ s"StateStoreId[ operatorId=$operatorId, partitionId=$partitionId, storeName=$storeName ]"
}
}
@@ -841,12 +927,37 @@ object StateStore extends Logging {
private val maintenanceThreadPoolLock = new Object
+ private val unloadedProvidersToClose =
+ new ConcurrentLinkedQueue[(StateStoreProviderId, StateStoreProvider)]
+
// This set is to keep track of the partitions that are queued
// for maintenance or currently have maintenance running on them
// to prevent the same partition from being processed concurrently.
@GuardedBy("maintenanceThreadPoolLock")
private val maintenancePartitions = new mutable.HashSet[StateStoreProviderId]
+ /** Reports to the coordinator that a StateStore has committed */
+ def reportCommitToCoordinator(
+ version: Long,
+ stateStoreId: StateStoreId,
+ hadoopConf: Configuration): Unit = {
+ try {
+ val runId = UUID.fromString(StateStoreProvider.getRunId(hadoopConf))
+ val providerId = StateStoreProviderId(stateStoreId, runId)
+ // The coordinator will handle whether tracking is active for this batch
+ // If tracking is not active, it will just reply without processing
+ StateStoreProvider.coordinatorRef.foreach(
+ _.reportStateStoreCommit(providerId, version, stateStoreId.storeName)
+ )
+ logDebug(log"Reported commit for store " +
+ log"${MDC(STATE_STORE_ID, stateStoreId)} at version ${MDC(VERSION_NUM, version)}")
+ } catch {
+ case NonFatal(e) =>
+ // Log but don't fail the commit if reporting fails
+ logWarning(log"Failed to report StateStore commit: ${MDC(EXCEPTION, e)}")
+ }
+ }
+
/**
* Runs the `task` periodically and bubbles any exceptions that it encounters.
*
@@ -948,6 +1059,56 @@ object StateStore extends Logging {
storeProvider.getReadStore(version, stateStoreCkptId)
}
+ /**
+ * Converts an existing read-only state store to a writable state store.
+ *
+ * This method provides an optimization for stateful operations that need to both read and update
+ * state within the same task. Instead of opening separate read and write instances (which may
+ * cause resource contention or duplication), this method reuses the already loaded read store
+ * and transforms it into a writable store.
+ *
+ * The optimization is particularly valuable for state stores with expensive initialization costs
+ * or limited concurrency capabilities (like RocksDB). It eliminates redundant loading of the same
+ * state data and reduces resource usage.
+ *
+ * @param readStore The existing read-only state store to convert to a writable store
+ * @param storeProviderId Unique identifier for the state store provider
+ * @param keySchema Schema of the state store keys
+ * @param valueSchema Schema of the state store values
+ * @param keyStateEncoderSpec Specification for encoding the state keys
+ * @param version The version of the state store (must match the read store's version)
+ * @param stateStoreCkptId Optional checkpoint identifier for the state store
+ * @param stateSchemaBroadcast Optional broadcast of the state schema
+ * @param useColumnFamilies Whether to use column families in the state store
+ * @param storeConf Configuration for the state store
+ * @param hadoopConf Hadoop configuration
+ * @param useMultipleValuesPerKey Whether the store supports multiple values per key
+ * @return A writable StateStore instance that can be used to update and commit changes
+ * @throws SparkException If the store cannot be loaded or if there's insufficient memory
+ */
+ def getWriteStore(
+ readStore: ReadStateStore,
+ storeProviderId: StateStoreProviderId,
+ keySchema: StructType,
+ valueSchema: StructType,
+ keyStateEncoderSpec: KeyStateEncoderSpec,
+ version: Long,
+ stateStoreCkptId: Option[String],
+ stateSchemaBroadcast: Option[StateSchemaBroadcast],
+ useColumnFamilies: Boolean,
+ storeConf: StateStoreConf,
+ hadoopConf: Configuration,
+ useMultipleValuesPerKey: Boolean = false): StateStore = {
+ hadoopConf.set(StreamExecution.RUN_ID_KEY, storeProviderId.queryRunId.toString)
+ if (version < 0) {
+ throw QueryExecutionErrors.unexpectedStateStoreVersion(version)
+ }
+ val storeProvider = getStateStoreProvider(storeProviderId, keySchema, valueSchema,
+ keyStateEncoderSpec, useColumnFamilies, storeConf, hadoopConf, useMultipleValuesPerKey,
+ stateSchemaBroadcast)
+ storeProvider.upgradeReadStoreToWriteStore(readStore, version, stateStoreCkptId)
+ }
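A hedged sketch of the read-then-upgrade flow this enables; the helper name and the defaults chosen below are illustrative, and the real wiring is done in StateStoreRDD later in this diff:

  // Upgrade a ReadStateStore that was already opened for `version` in this task into a
  // writable store for the same partition, reusing the already loaded provider.
  def upgradeForWrite(
      readStore: ReadStateStore,
      providerId: StateStoreProviderId,
      keySchema: StructType,
      valueSchema: StructType,
      encoderSpec: KeyStateEncoderSpec,
      version: Long,
      storeConf: StateStoreConf,
      hadoopConf: Configuration): StateStore = {
    StateStore.getWriteStore(readStore, providerId, keySchema, valueSchema,
      encoderSpec, version, stateStoreCkptId = None, stateSchemaBroadcast = None,
      useColumnFamilies = false, storeConf = storeConf, hadoopConf = hadoopConf)
  }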
+
/** Get or create a store associated with the id. */
def get(
storeProviderId: StateStoreProviderId,
@@ -1010,7 +1171,21 @@ object StateStore extends Logging {
if (!storeConf.unloadOnCommit) {
val otherProviderIds = loadedProviders.keys.filter(_ != storeProviderId).toSeq
val providerIdsToUnload = reportActiveStoreInstance(storeProviderId, otherProviderIds)
- providerIdsToUnload.foreach(unload(_))
+ val taskContextIdLogLine = Option(TaskContext.get()).map { tc =>
+ log"taskId=${MDC(LogKeys.TASK_ID, tc.taskAttemptId())}"
+ }.getOrElse(log"")
+ providerIdsToUnload.foreach(id => {
+ loadedProviders.remove(id).foreach(provider => {
+ // Trigger maintenance thread to immediately do maintenance on and close the provider.
+ // Doing maintenance first allows us to do maintenance for a constantly-moving state
+ // store.
+ logInfo(log"Submitted maintenance from task thread to close " +
+ log"provider=${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}." + taskContextIdLogLine +
+ log"Removed provider from loadedProviders")
+ submitMaintenanceWorkForProvider(
+ id, provider, storeConf, MaintenanceTaskType.FromTaskThread)
+ })
+ })
}
provider
@@ -1027,14 +1202,30 @@ object StateStore extends Logging {
}
}
- /** Unload a state store provider */
- def unload(storeProviderId: StateStoreProviderId): Unit = loadedProviders.synchronized {
- loadedProviders.remove(storeProviderId).foreach(_.close())
+ /**
+ * Unload a state store provider.
+ * If alreadyRemovedProvider is None, the provider will be removed from
+ * loadedProviders and closed.
+ * If alreadyRemovedProvider is Some, the passed-in provider will be closed
+ * without touching loadedProviders.
+ * WARNING: CAN ONLY BE CALLED FROM MAINTENANCE THREAD!
+ */
+ def removeFromLoadedProvidersAndClose(
+ storeProviderId: StateStoreProviderId,
+ alreadyRemovedProvider: Option[StateStoreProvider] = None): Unit = {
+ val providerToClose = alreadyRemovedProvider.orElse {
+ loadedProviders.synchronized {
+ loadedProviders.remove(storeProviderId)
+ }
+ }
+ providerToClose.foreach { provider =>
+ provider.close()
+ }
}
/** Unload all state store providers: unit test purpose */
private[sql] def unloadAll(): Unit = loadedProviders.synchronized {
- loadedProviders.keySet.foreach { key => unload(key) }
+ loadedProviders.keySet.foreach { key => removeFromLoadedProvidersAndClose(key) }
loadedProviders.clear()
}
@@ -1073,7 +1264,7 @@ object StateStore extends Logging {
/** Unload and stop all state store providers */
def stop(): Unit = loadedProviders.synchronized {
- loadedProviders.keySet.foreach { key => unload(key) }
+ loadedProviders.keySet.foreach { key => removeFromLoadedProvidersAndClose(key) }
loadedProviders.clear()
_coordRef = null
stopMaintenanceTask()
@@ -1088,7 +1279,7 @@ object StateStore extends Logging {
if (SparkEnv.get != null && !isMaintenanceRunning && !storeConf.unloadOnCommit) {
maintenanceTask = new MaintenanceTask(
storeConf.maintenanceInterval,
- task = { doMaintenance() }
+ task = { doMaintenance(storeConf) }
)
maintenanceThreadPool = new MaintenanceThreadPool(numMaintenanceThreads,
maintenanceShutdownTimeout)
@@ -1097,6 +1288,27 @@ object StateStore extends Logging {
}
}
+ // Wait until this partition can be processed
+ private def awaitProcessThisPartition(
+ id: StateStoreProviderId,
+ timeoutMs: Long): Boolean = maintenanceThreadPoolLock.synchronized {
+ val startTime = System.currentTimeMillis()
+ val endTime = startTime + timeoutMs
+
+ // If immediate processing fails, wait with timeout
+ var canProcessThisPartition = processThisPartition(id)
+ while (!canProcessThisPartition && System.currentTimeMillis() < endTime) {
+ maintenanceThreadPoolLock.wait(timeoutMs)
+ canProcessThisPartition = processThisPartition(id)
+ }
+ val elapsedTime = System.currentTimeMillis() - startTime
+ logInfo(log"Waited for ${MDC(LogKeys.TOTAL_TIME, elapsedTime)} ms to be able to process " +
+ log"maintenance for partition ${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}")
+ canProcessThisPartition
+ }
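The partition handoff relies on the standard monitor wait/notify pattern: a caller waits on maintenanceThreadPoolLock while the partition is still being processed, and the notifyAll() in the maintenance task's finally block further below wakes it up. A self-contained sketch of that pattern, using plain Scala and placeholder names:

  object PartitionSlotSketch {
    private val lock = new Object
    private val inFlight = scala.collection.mutable.HashSet[String]()

    // Returns true once `id` is free (and claims it), or false after roughly timeoutMs.
    def awaitSlot(id: String, timeoutMs: Long): Boolean = lock.synchronized {
      val deadline = System.currentTimeMillis() + timeoutMs
      while (inFlight.contains(id) && System.currentTimeMillis() < deadline) {
        lock.wait(math.max(1, deadline - System.currentTimeMillis()))
      }
      if (inFlight.contains(id)) false else { inFlight.add(id); true }
    }

    // Mirrors the notifyAll() in the maintenance task's finally block.
    def releaseSlot(id: String): Unit = lock.synchronized {
      inFlight.remove(id)
      lock.notifyAll()
    }
  }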
+
+ private def doMaintenance(): Unit = doMaintenance(StateStoreConf.empty)
+
private def processThisPartition(id: StateStoreProviderId): Boolean = {
maintenanceThreadPoolLock.synchronized {
if (!maintenancePartitions.contains(id)) {
@@ -1112,56 +1324,42 @@ object StateStore extends Logging {
* Execute background maintenance task in all the loaded store providers if they are still
* the active instances according to the coordinator.
*/
- private def doMaintenance(): Unit = {
+ private def doMaintenance(storeConf: StateStoreConf): Unit = {
logDebug("Doing maintenance")
if (SparkEnv.get == null) {
throw new IllegalStateException("SparkEnv not active, cannot do maintenance on StateStores")
}
+
+ // Providers that couldn't be processed now and need to be added back to the queue
+ val providersToRequeue = new ArrayBuffer[(StateStoreProviderId, StateStoreProvider)]()
+
+ // unloadedProvidersToClose holds StateStoreProviders that have already been removed from
+ // loadedProviders and can now be processed for maintenance. It contains providers that we
+ // were not able to process for maintenance in a previous iteration.
+ while (!unloadedProvidersToClose.isEmpty) {
+ val (providerId, provider) = unloadedProvidersToClose.poll()
+
+ if (processThisPartition(providerId)) {
+ submitMaintenanceWorkForProvider(
+ providerId, provider, storeConf, MaintenanceTaskType.FromUnloadedProvidersQueue)
+ } else {
+ providersToRequeue += ((providerId, provider))
+ }
+ }
+
+ if (providersToRequeue.nonEmpty) {
+ logInfo(log"Had to requeue ${MDC(LogKeys.SIZE, providersToRequeue.size)} providers " +
+ log"for maintenance in doMaintenance")
+ }
+
+ providersToRequeue.foreach(unloadedProvidersToClose.offer)
+
loadedProviders.synchronized {
loadedProviders.toSeq
}.foreach { case (id, provider) =>
if (processThisPartition(id)) {
- maintenanceThreadPool.execute(() => {
- val startTime = System.currentTimeMillis()
- try {
- provider.doMaintenance()
- if (!verifyIfStoreInstanceActive(id)) {
- unload(id)
- logInfo(log"Unloaded ${MDC(LogKeys.STATE_STORE_PROVIDER, provider)}")
- }
- } catch {
- case NonFatal(e) =>
- logWarning(log"Error managing ${MDC(LogKeys.STATE_STORE_PROVIDER, provider)}, " +
- log"unloading state store provider", e)
- // When we get a non-fatal exception, we just unload the provider.
- //
- // By not bubbling the exception to the maintenance task thread or the query execution
- // thread, it's possible for a maintenance thread pool task to continue failing on
- // the same partition. Additionally, if there is some global issue that will cause
- // all maintenance thread pool tasks to fail, then bubbling the exception and
- // stopping the pool is faster than waiting for all tasks to see the same exception.
- //
- // However, we assume that repeated failures on the same partition and global issues
- // are rare. The benefit to unloading just the partition with an exception is that
- // transient issues on a given provider do not affect any other providers; so, in
- // most cases, this should be a more performant solution.
- unload(id)
- } finally {
- val duration = System.currentTimeMillis() - startTime
- val logMsg =
- log"Finished maintenance task for " +
- log"provider=${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}" +
- log" in elapsed_time=${MDC(LogKeys.TIME_UNITS, duration)}\n"
- if (duration > 5000) {
- logInfo(logMsg)
- } else {
- logDebug(logMsg)
- }
- maintenanceThreadPoolLock.synchronized {
- maintenancePartitions.remove(id)
- }
- }
- })
+ submitMaintenanceWorkForProvider(
+ id, provider, storeConf, MaintenanceTaskType.FromLoadedProviders)
} else {
logInfo(log"Not processing partition ${MDC(LogKeys.PARTITION_ID, id)} " +
log"for maintenance because it is currently " +
@@ -1170,6 +1368,108 @@ object StateStore extends Logging {
}
}
+ /**
+ * Submits maintenance work for a provider to the maintenance thread pool.
+ *
+ * @param id The StateStore provider ID to perform maintenance on
+ * @param provider The StateStore provider instance
+ * @param storeConf Configuration for the state store, used for maintenance timeouts
+ * @param source Where the maintenance request originated: the task thread, the requeue
+ *               queue of already-unloaded providers, or the periodic scan of loadedProviders
+ */
+ private def submitMaintenanceWorkForProvider(
+ id: StateStoreProviderId,
+ provider: StateStoreProvider,
+ storeConf: StateStoreConf,
+ source: MaintenanceTaskType = FromLoadedProviders): Unit = {
+ maintenanceThreadPool.execute(() => {
+ val startTime = System.currentTimeMillis()
+ // Determine if we can process this partition based on the source
+ val canProcessThisPartition = source match {
+ case FromTaskThread =>
+ // Provider from task thread needs to wait for lock
+ // We potentially need to wait for ongoing maintenance to finish processing
+ // this partition
+ val timeoutMs = storeConf.stateStoreMaintenanceProcessingTimeout * 1000
+ val ableToProcessNow = awaitProcessThisPartition(id, timeoutMs)
+ if (!ableToProcessNow) {
+ // Add to queue for later processing if we can't process now
+ // This will be resubmitted for maintenance later by the background maintenance task
+ unloadedProvidersToClose.add((id, provider))
+ }
+ ableToProcessNow
+
+ case FromUnloadedProvidersQueue =>
+ // Provider from queue can be processed immediately
+ // (we've already removed it from loadedProviders)
+ true
+
+ case FromLoadedProviders =>
+ // Provider from loadedProviders can be processed immediately
+ // as it's in maintenancePartitions
+ true
+ }
+
+ if (canProcessThisPartition) {
+ val awaitingPartitionDuration = System.currentTimeMillis() - startTime
+ try {
+ provider.doMaintenance()
+ // Handle unloading based on source, and log only when a provider was actually closed
+ source match {
+ case FromTaskThread | FromUnloadedProvidersQueue =>
+ // Provider already removed from loadedProviders, just close it
+ removeFromLoadedProvidersAndClose(id, Some(provider))
+ logInfo(log"Unloaded ${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}")
+
+ case FromLoadedProviders =>
+ // Unload only if the coordinator says this instance is no longer active
+ if (!verifyIfStoreInstanceActive(id)) {
+ removeFromLoadedProvidersAndClose(id)
+ logInfo(log"Unloaded ${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}")
+ }
+ }
+ } catch {
+ case NonFatal(e) =>
+ logWarning(log"Error doing maintenance on provider:" +
+ log" ${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}. " +
+ log"Could not unload state store provider", e)
+ // When we get a non-fatal exception, we just unload the provider.
+ //
+ // By not bubbling the exception to the maintenance task thread or the query execution
+ // thread, it's possible for a maintenance thread pool task to continue failing on
+ // the same partition. Additionally, if there is some global issue that will cause
+ // all maintenance thread pool tasks to fail, then bubbling the exception and
+ // stopping the pool is faster than waiting for all tasks to see the same exception.
+ //
+ // However, we assume that repeated failures on the same partition and global issues
+ // are rare. The benefit to unloading just the partition with an exception is that
+ // transient issues on a given provider do not affect any other providers; so, in
+ // most cases, this should be a more performant solution.
+ source match {
+ case FromTaskThread | FromUnloadedProvidersQueue =>
+ removeFromLoadedProvidersAndClose(id, Some(provider))
+
+ case FromLoadedProviders =>
+ removeFromLoadedProvidersAndClose(id)
+ }
+ } finally {
+ val duration = System.currentTimeMillis() - startTime
+ val logMsg =
+ log"Finished maintenance task for " +
+ log"provider=${MDC(LogKeys.STATE_STORE_PROVIDER_ID, id)}" +
+ log" in elapsed_time=${MDC(LogKeys.TIME_UNITS, duration)}" +
+ log" and awaiting_partition_time=" +
+ log"${MDC(LogKeys.TIME_UNITS, awaitingPartitionDuration)}\n"
+ if (duration > 5000) {
+ logInfo(logMsg)
+ } else {
+ logDebug(logMsg)
+ }
+ maintenanceThreadPoolLock.synchronized {
+ maintenancePartitions.remove(id)
+ maintenanceThreadPoolLock.notifyAll()
+ }
+ }
+ }
+ })
+ }
+
private def reportActiveStoreInstance(
storeProviderId: StateStoreProviderId,
otherProviderIds: Seq[StateStoreProviderId]): Seq[StateStoreProviderId] = {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreChangelog.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreChangelog.scala
index bcaff4c60d08f..4c5dea63baeab 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreChangelog.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreChangelog.scala
@@ -21,21 +21,20 @@ import java.io.{DataInputStream, DataOutputStream, FileNotFoundException, IOExce
import scala.util.control.NonFatal
-import com.google.common.io.ByteStreams
-import org.apache.commons.io.IOUtils
import org.apache.hadoop.fs.{FSError, Path}
import org.json4s._
import org.json4s.jackson.Serialization
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys._
import org.apache.spark.io.CompressionCodec
import org.apache.spark.sql.catalyst.expressions.UnsafeRow
import org.apache.spark.sql.errors.QueryExecutionErrors
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager
-import org.apache.spark.sql.execution.streaming.CheckpointFileManager.CancellableFSDataOutputStream
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager
+import org.apache.spark.sql.execution.streaming.checkpointing.CheckpointFileManager.CancellableFSDataOutputStream
import org.apache.spark.sql.execution.streaming.state.RecordType.RecordType
import org.apache.spark.util.NextIterator
+import org.apache.spark.util.Utils
/**
* Enum used to write record types to changelog files used with RocksDBStateStoreProvider.
@@ -132,7 +131,7 @@ abstract class StateStoreChangelogWriter(
def abort(): Unit = {
try {
if (backingFileStream != null) backingFileStream.cancel()
- if (compressedStream != null) IOUtils.closeQuietly(compressedStream)
+ if (compressedStream != null) Utils.closeQuietly(compressedStream)
} catch {
// Closing the compressedStream causes the stream to write/flush data into the
// rawStream. Since the rawStream is already closed, there may be errors.
@@ -371,7 +370,11 @@ class StateStoreChangelogReaderFactory(
// Or if the first record in the changelog file in V1 has a large enough
// key, readUTF() will throw a UTFDataFormatException so we should return
// version 1 (SPARK-51922).
- case _: java.io.EOFException | _: java.io.UTFDataFormatException => 1
+ case _: java.io.EOFException |
+ _: java.io.UTFDataFormatException |
+ // SPARK-52553 - Can throw this if the bytes in the file are coincidentally
+ // decoded as a UTF string like "v)".
+ _: NumberFormatException => 1
}
}
@@ -481,14 +484,14 @@ class StateStoreChangelogReaderV1(
} else {
// TODO: reuse the key buffer and value buffer across records.
val keyBuffer = new Array[Byte](keySize)
- ByteStreams.readFully(input, keyBuffer, 0, keySize)
+ Utils.readFully(input, keyBuffer, 0, keySize)
val valueSize = input.readInt()
if (valueSize < 0) {
// A deletion record
(RecordType.DELETE_RECORD, keyBuffer, null)
} else {
val valueBuffer = new Array[Byte](valueSize)
- ByteStreams.readFully(input, valueBuffer, 0, valueSize)
+ Utils.readFully(input, valueBuffer, 0, valueSize)
// A put record.
(RecordType.PUT_RECORD, keyBuffer, valueBuffer)
}
@@ -512,7 +515,7 @@ class StateStoreChangelogReaderV2(
private def parseBuffer(input: DataInputStream): Array[Byte] = {
val blockSize = input.readInt()
val blockBuffer = new Array[Byte](blockSize)
- ByteStreams.readFully(input, blockBuffer, 0, blockSize)
+ Utils.readFully(input, blockBuffer, 0, blockSize)
blockBuffer
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreConf.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreConf.scala
index 9a994200baeb0..00bb7de46dc4d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreConf.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreConf.scala
@@ -17,12 +17,14 @@
package org.apache.spark.sql.execution.streaming.state
-import org.apache.spark.sql.execution.streaming.StatefulOperatorStateInfo
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorStateInfo
import org.apache.spark.sql.internal.SQLConf
/** A class that contains configuration parameters for [[StateStore]]s. */
class StateStoreConf(
- @transient private[state] val sqlConf: SQLConf,
+ // Should be private because it can be null after deserialization (due to
+ // the transient annotation).
+ @transient private val sqlConf: SQLConf,
val extraOptions: Map[String, String] = Map.empty)
extends Serializable {
@@ -38,6 +40,8 @@ class StateStoreConf(
*/
val stateStoreMaintenanceShutdownTimeout: Long = sqlConf.stateStoreMaintenanceShutdownTimeout
+ val stateStoreMaintenanceProcessingTimeout: Long = sqlConf.stateStoreMaintenanceProcessingTimeout
+
/**
* Minimum number of delta files in a chain after which HDFSBackedStateStore will
* consider generating a snapshot.
@@ -67,6 +71,13 @@ class StateStoreConf(
/** Whether validate the underlying format or not. */
val formatValidationEnabled: Boolean = sqlConf.stateStoreFormatValidationEnabled
+ /**
+ * Whether to validate StateStore commits for ForeachBatch sinks to ensure all partitions
+ * are processed. This helps detect incomplete processing due to operations like show()
+ * or limit().
+ */
+ val commitValidationEnabled = sqlConf.stateStoreCommitValidationEnabled
+
/**
* Whether to validate the value side. This config is applied to both validators as below:
*
@@ -106,6 +117,9 @@ class StateStoreConf(
/** Whether to unload the store on task completion. */
val unloadOnCommit = sqlConf.stateStoreUnloadOnCommit
+ /** The version of the state store checkpoint format. */
+ val stateStoreCheckpointFormatVersion: Int = sqlConf.stateStoreCheckpointFormatVersion
+
/**
* Additional configurations related to state store. This will capture all configs in
* SQLConf that start with `spark.sql.streaming.stateStore.`
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreCoordinator.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreCoordinator.scala
index 903f27fb2a223..37e35c917a521 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreCoordinator.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreCoordinator.scala
@@ -22,7 +22,7 @@ import java.util.UUID
import scala.collection.mutable
import org.apache.spark.SparkEnv
-import org.apache.spark.internal.{Logging, LogKeys, MDC}
+import org.apache.spark.internal.{Logging, LogKeys}
import org.apache.spark.rpc.{RpcCallContext, RpcEndpointRef, RpcEnv, ThreadSafeRpcEndpoint}
import org.apache.spark.scheduler.ExecutorCacheTaskLocation
import org.apache.spark.sql.internal.SQLConf
@@ -53,6 +53,24 @@ private case class VerifyIfInstanceActive(storeId: StateStoreProviderId, executo
private case class GetLocation(storeId: StateStoreProviderId)
extends StateStoreCoordinatorMessage
+/** Report that a StateStore has committed for tracking purposes */
+private case class ReportStateStoreCommit(
+ storeId: StateStoreProviderId,
+ version: Long,
+ storeName: String = StateStoreId.DEFAULT_STORE_NAME)
+ extends StateStoreCoordinatorMessage
+
+/** Start tracking StateStore commits for a batch */
+private case class StartStateStoreCommitTrackingForBatch(
+ runId: UUID,
+ batchId: Long,
+ expectedStores: Map[Long, Map[String, Int]]) // operatorId -> (storeName -> numPartitions)
+ extends StateStoreCoordinatorMessage
+
+/** Validate that all expected StateStores have committed for a batch */
+private case class ValidateStateStoreCommitForBatch(runId: UUID, batchId: Long)
+ extends StateStoreCoordinatorMessage
+
private case class DeactivateInstances(runId: UUID)
extends StateStoreCoordinatorMessage
@@ -176,6 +194,29 @@ class StateStoreCoordinatorRef private(rpcEndpointRef: RpcEndpointRef) {
LogLaggingStateStores(queryRunId, latestVersion, isTerminatingTrigger))
}
+
+ /** Start tracking StateStore commits for a batch */
+ private[sql] def startStateStoreCommitTrackingForBatch(
+ runId: UUID,
+ batchId: Long,
+ expectedStores: Map[Long, Map[String, Int]]): Unit = {
+ rpcEndpointRef.askSync[Unit](
+ StartStateStoreCommitTrackingForBatch(runId, batchId, expectedStores))
+ }
+
+ /** Report that a StateStore has committed */
+ private[sql] def reportStateStoreCommit(
+ storeId: StateStoreProviderId,
+ version: Long,
+ storeName: String = StateStoreId.DEFAULT_STORE_NAME): Unit = {
+ rpcEndpointRef.askSync[Unit](ReportStateStoreCommit(storeId, version, storeName))
+ }
+
+ /** Validate that all expected StateStores have committed for a batch */
+ private[sql] def validateStateStoreCommitForBatch(runId: UUID, batchId: Long): Unit = {
+ rpcEndpointRef.askSync[Unit](ValidateStateStoreCommitForBatch(runId, batchId))
+ }
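Taken together, the three RPCs above give the driver a simple bracket around each batch. A hypothetical driver-side flow (coordinatorRef, runId and batchId are assumed to be in scope; the real call sites live in the microbatch execution path, outside this diff):

  // One stateful operator (id 0) using the default store name across 200 partitions.
  val expected: Map[Long, Map[String, Int]] =
    Map(0L -> Map(StateStoreId.DEFAULT_STORE_NAME -> 200))
  coordinatorRef.startStateStoreCommitTrackingForBatch(runId, batchId, expected)

  // ... the batch runs; each committed store reports via reportStateStoreCommit ...

  // The coordinator replies with StateStoreCommitValidationFailed if any expected
  // partition never committed for this batch.
  coordinatorRef.validateStateStoreCommitForBatch(runId, batchId)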
+
/**
* Endpoint used for testing.
* Get the latest snapshot version uploaded for a state store.
@@ -222,6 +263,10 @@ private class StateStoreCoordinator(
// Default snapshot upload event to use when a provider has never uploaded a snapshot
private val defaultSnapshotUploadEvent = SnapshotUploadEvent(0, 0)
+ // Tracking structure for StateStore commits per batch
+ // Key: (runId, batchId) -> Value: CommitTracker
+ private val batchCommitTrackers = new mutable.HashMap[(UUID, Long), BatchCommitTracker]
+
// Stores the last timestamp in milliseconds for each queryRunId indicating when the
// coordinator did a report on instances lagging behind on snapshot uploads.
// The initial timestamp is defaulted to 0 milliseconds.
@@ -264,6 +309,10 @@ private class StateStoreCoordinator(
val storeIdsToRemove =
instances.keys.filter(_.queryRunId == runId).toSeq
instances --= storeIdsToRemove
+
+ val runIdsToRemove = batchCommitTrackers.keys.filter(_._1 == runId)
+ batchCommitTrackers --= runIdsToRemove
+
// Also remove these instances from snapshot upload event tracking
stateStoreLatestUploadedSnapshot --= storeIdsToRemove
// Remove the corresponding run id entries for report time and starting time
@@ -336,6 +385,49 @@ private class StateStoreCoordinator(
}
context.reply(true)
+ case StartStateStoreCommitTrackingForBatch(runId, batchId, expectedStores) =>
+ val key = (runId, batchId)
+ if (batchCommitTrackers.contains(key)) {
+ context.sendFailure(new IllegalStateException(
+ s"Batch commit tracker already exists for runId=$runId, batchId=$batchId"))
+ } else {
+ batchCommitTrackers.put(key, new BatchCommitTracker(runId, batchId, expectedStores))
+ logInfo(s"Started tracking commits for batch $batchId with " +
+ s"${expectedStores.values.map(_.values.sum).sum} expected stores")
+ context.reply(())
+ }
+
+ case ReportStateStoreCommit(storeId, version, storeName) =>
+ // StateStore version = batchId + 1, so we need to adjust
+ val batchId = version - 1
+ val key = (storeId.queryRunId, batchId)
+ batchCommitTrackers.get(key) match {
+ case Some(tracker) =>
+ tracker.recordCommit(storeId, storeName)
+ context.reply(())
+ case None =>
+ // No commit tracker was found for this batch, so tracking is not active; just acknowledge
+ context.reply(())
+ }
+
+ case ValidateStateStoreCommitForBatch(runId, batchId) =>
+ val key = (runId, batchId)
+ batchCommitTrackers.get(key) match {
+ case Some(tracker) =>
+ try {
+ tracker.validateAllCommitted()
+ batchCommitTrackers.remove(key) // Clean up after validation
+ context.reply(())
+ } catch {
+ case e: StateStoreCommitValidationFailed =>
+ batchCommitTrackers.remove(key) // Clean up even on failure
+ context.sendFailure(e)
+ }
+ case None =>
+ context.sendFailure(new IllegalStateException(
+ s"No commit tracker found for runId=$runId, batchId=$batchId"))
+ }
+
case GetLatestSnapshotVersionForTesting(providerId) =>
val version = stateStoreLatestUploadedSnapshot.get(providerId).map(_.version)
logDebug(s"Got latest snapshot version of the state store $providerId: $version")
@@ -402,6 +494,55 @@ private class StateStoreCoordinator(
}
}
+/**
+ * Tracks StateStore commits for a batch to ensure all expected stores commit
+ */
+private class BatchCommitTracker(
+ runId: UUID,
+ batchId: Long,
+ expectedStores: Map[Long, Map[String, Int]]) extends Logging {
+
+ // Track committed stores: (operatorId, partitionId, storeName) -> committed
+ private val committedStores = new mutable.HashSet[(Long, Int, String)]()
+
+ def recordCommit(storeId: StateStoreProviderId, storeName: String): Unit = {
+ val key = (storeId.storeId.operatorId, storeId.storeId.partitionId, storeName)
+ committedStores.add(key)
+ logDebug(s"Recorded commit for store $storeId with name $storeName for batch $batchId")
+ }
+
+ def validateAllCommitted(): Unit = {
+ val missingCommits = new mutable.ArrayBuffer[String]()
+
+ expectedStores.foreach { case (operatorId, storeMap) =>
+ storeMap.foreach { case (storeName, numPartitions) =>
+ for (partitionId <- 0 until numPartitions) {
+ val key = (operatorId, partitionId, storeName)
+ if (!committedStores.contains(key)) {
+ missingCommits += s"(operator=$operatorId, partition=$partitionId, store=$storeName)"
+ }
+ }
+ }
+ }
+
+ if (missingCommits.nonEmpty) {
+ val totalExpected = expectedStores.values.map(_.values.sum).sum
+ val errorMsg = s"Not all StateStores committed for batch $batchId. " +
+ s"Expected $totalExpected commits but got ${committedStores.size}. " +
+ s"Missing commits: ${missingCommits.mkString(", ")}"
+ logError(errorMsg)
+ throw StateStoreErrors.stateStoreCommitValidationFailed(
+ batchId,
+ totalExpected,
+ committedStores.size,
+ missingCommits.mkString(", ")
+ )
+ }
+
+ logInfo(s"All ${committedStores.size} StateStores successfully committed for batch $batchId")
+ }
+}
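A self-contained illustration of the bookkeeping validateAllCommitted() performs, with made-up numbers: expected stores are keyed by (operatorId, partitionId, storeName), and anything not reported shows up in the missing list.

  val expectedStores = Map(0L -> Map("default" -> 3))         // operator 0, 3 partitions
  val committed = Set((0L, 0, "default"), (0L, 2, "default")) // partition 1 never committed
  val missing = for {
    (op, stores) <- expectedStores.toSeq
    (name, parts) <- stores.toSeq
    p <- 0 until parts
    if !committed.contains((op, p, name))
  } yield s"(operator=$op, partition=$p, store=$name)"
  // missing == Seq("(operator=0, partition=1, store=default)")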
+
case class SnapshotUploadEvent(
version: Long,
timestamp: Long
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreErrors.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreErrors.scala
index 633fd96f90567..43682de034462 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreErrors.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreErrors.scala
@@ -92,6 +92,18 @@ object StateStoreErrors {
new StateStoreIncorrectNumOrderingColsForPrefixScan(numPrefixCols)
}
+ def invalidStateMachineTransition(
+ oldState: String,
+ newState: String,
+ transition: String,
+ storeId: StateStoreId): StateStoreInvalidStateMachineTransition = {
+ new StateStoreInvalidStateMachineTransition(oldState, newState, transition, storeId)
+ }
+
+ def invalidStamp(providedStamp: Long, currentStamp: Long): StateStoreInvalidStamp = {
+ new StateStoreInvalidStamp(providedStamp, currentStamp)
+ }
+
def incorrectNumOrderingColsForRangeScan(numOrderingCols: String):
StateStoreIncorrectNumOrderingColsForRangeScan = {
new StateStoreIncorrectNumOrderingColsForRangeScan(numOrderingCols)
@@ -175,6 +187,11 @@ object StateStoreErrors {
numSchemaFiles, schemaFilesThreshold, addedColFamilies, removedColFamilies)
}
+ def streamingStateCheckpointLocationNotEmpty(checkpointLocation: String)
+ : StateStoreCheckpointLocationNotEmpty = {
+ new StateStoreCheckpointLocationNotEmpty(checkpointLocation)
+ }
+
def stateStoreColumnFamilyMismatch(
columnFamilyName: String,
oldColumnFamilySchema: String,
@@ -204,6 +221,14 @@ object StateStoreErrors {
new StateStoreInvalidConfigAfterRestart(configName, oldConfig, newConfig)
}
+ def stateStoreCommitValidationFailed(
+ batchId: Long,
+ expectedCommits: Int,
+ actualCommits: Int,
+ missingCommits: String): StateStoreCommitValidationFailed = {
+ new StateStoreCommitValidationFailed(batchId, expectedCommits, actualCommits, missingCommits)
+ }
+
def duplicateStateVariableDefined(stateName: String):
StateStoreDuplicateStateVariableDefined = {
new StateStoreDuplicateStateVariableDefined(stateName)
@@ -343,6 +368,30 @@ class StateStoreVariableSizeOrderingColsNotSupported(fieldName: String, index: S
errorClass = "STATE_STORE_VARIABLE_SIZE_ORDERING_COLS_NOT_SUPPORTED",
messageParameters = Map("fieldName" -> fieldName, "index" -> index))
+class StateStoreInvalidStateMachineTransition(
+ oldState: String,
+ newState: String,
+ operation: String,
+ storeId: StateStoreId)
+ extends SparkRuntimeException(
+ errorClass = "STATE_STORE_INVALID_STATE_MACHINE_TRANSITION",
+ messageParameters = Map(
+ "oldState" -> oldState,
+ "newState" -> newState,
+ "operation" -> operation,
+ "storeId" -> storeId.toString
+ )
+ )
+
+class StateStoreInvalidStamp(providedStamp: Long, currentStamp: Long)
+ extends SparkRuntimeException(
+ errorClass = "STATE_STORE_INVALID_STAMP",
+ messageParameters = Map(
+ "providedStamp" -> providedStamp.toString,
+ "currentStamp" -> currentStamp.toString
+ )
+ )
+
class StateStoreNullTypeOrderingColsNotSupported(fieldName: String, index: String)
extends SparkUnsupportedOperationException(
errorClass = "STATE_STORE_NULL_TYPE_ORDERING_COLS_NOT_SUPPORTED",
@@ -430,6 +479,13 @@ class StateStoreStateSchemaFilesThresholdExceeded(
"addedColumnFamilies" -> addedColFamilies.mkString("(", ",", ")"),
"removedColumnFamilies" -> removedColFamilies.mkString("(", ",", ")")))
+class StateStoreCheckpointLocationNotEmpty(
+ checkpointLocation: String)
+ extends SparkUnsupportedOperationException(
+ errorClass = "STATE_STORE_CHECKPOINT_LOCATION_NOT_EMPTY",
+ messageParameters = Map(
+ "checkpointLocation" -> checkpointLocation))
+
class StateStoreSnapshotFileNotFound(fileToRead: String, clazz: String)
extends SparkRuntimeException(
errorClass = "CANNOT_LOAD_STATE_STORE.CANNOT_READ_MISSING_SNAPSHOT_FILE",
@@ -488,3 +544,18 @@ class StateStoreOperationOutOfOrder(errorMsg: String)
errorClass = "STATE_STORE_OPERATION_OUT_OF_ORDER",
messageParameters = Map("errorMsg" -> errorMsg)
)
+
+class StateStoreCommitValidationFailed(
+ batchId: Long,
+ expectedCommits: Int,
+ actualCommits: Int,
+ missingCommits: String)
+ extends SparkRuntimeException(
+ errorClass = "STATE_STORE_COMMIT_VALIDATION_FAILED",
+ messageParameters = Map(
+ "batchId" -> batchId.toString,
+ "expectedCommits" -> expectedCommits.toString,
+ "actualCommits" -> actualCommits.toString,
+ "missingCommits" -> missingCommits
+ )
+ )
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreRDD.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreRDD.scala
index 4a3e045811686..c95faada419e2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreRDD.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/StateStoreRDD.scala
@@ -27,6 +27,28 @@ import org.apache.spark.sql.internal.SessionState
import org.apache.spark.sql.types.StructType
import org.apache.spark.util.SerializableConfiguration
+/**
+ * Thread local storage for sharing StateStore instances between RDDs.
+ * This allows a ReadStateStore to be reused by a subsequent StateStore operation.
+ */
+object StateStoreThreadLocalTracker {
+ /** Holds the ReadStateStore opened earlier in the current task, if any. */
+ private val storeInfo: ThreadLocal[ReadStateStore] = new ThreadLocal[ReadStateStore]
+
+ def setStore(store: ReadStateStore): Unit = {
+ storeInfo.set(store)
+ }
+
+ def getStore: Option[ReadStateStore] = {
+ Option(storeInfo.get())
+ }
+
+ def clearStore(): Unit = {
+ storeInfo.remove()
+ }
+}
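A hedged sketch of how the two RDDs use this tracker within a single task; the helper below is illustrative, and the actual calls are in ReadStateStoreRDD.compute, StateStoreRDD.compute, and the task completion listener added in package.scala further down:

  def handOff(readStore: ReadStateStore): Option[ReadStateStore] = {
    StateStoreThreadLocalTracker.setStore(readStore)   // set by ReadStateStoreRDD.compute after opening the store
    val reused = StateStoreThreadLocalTracker.getStore // checked when StateStoreRDD.compute starts
    // If defined, the write RDD upgrades it via StateStore.getWriteStore instead of StateStore.get.
    StateStoreThreadLocalTracker.clearStore()          // normally done by the task completion listener
    reused
  }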
+
abstract class BaseStateStoreRDD[T: ClassTag, U: ClassTag](
dataRDD: RDD[T],
checkpointLocation: String,
@@ -95,6 +117,7 @@ class ReadStateStoreRDD[T: ClassTag, U: ClassTag](
stateStoreCkptIds.map(_.apply(partition.index).head),
stateSchemaBroadcast,
useColumnFamilies, storeConf, hadoopConfBroadcast.value.value)
+ StateStoreThreadLocalTracker.setStore(store)
storeReadFunction(store, inputIter)
}
}
@@ -130,12 +153,22 @@ class StateStoreRDD[T: ClassTag, U: ClassTag](
val storeProviderId = getStateProviderId(partition)
val inputIter = dataRDD.iterator(partition, ctxt)
- val store = StateStore.get(
- storeProviderId, keySchema, valueSchema, keyStateEncoderSpec, storeVersion,
- uniqueId.map(_.apply(partition.index).head),
- stateSchemaBroadcast,
- useColumnFamilies, storeConf, hadoopConfBroadcast.value.value,
- useMultipleValuesPerKey)
+ val store = StateStoreThreadLocalTracker.getStore match {
+ case Some(readStateStore: ReadStateStore) =>
+ StateStore.getWriteStore(readStateStore, storeProviderId,
+ keySchema, valueSchema, keyStateEncoderSpec, storeVersion,
+ uniqueId.map(_.apply(partition.index).head),
+ stateSchemaBroadcast,
+ useColumnFamilies, storeConf, hadoopConfBroadcast.value.value,
+ useMultipleValuesPerKey)
+ case None =>
+ StateStore.get(
+ storeProviderId, keySchema, valueSchema, keyStateEncoderSpec, storeVersion,
+ uniqueId.map(_.apply(partition.index).head),
+ stateSchemaBroadcast,
+ useColumnFamilies, storeConf, hadoopConfBroadcast.value.value,
+ useMultipleValuesPerKey)
+ }
if (storeConf.unloadOnCommit) {
ctxt.addTaskCompletionListener[Unit](_ => {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/package.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/package.scala
index a82eff4812953..d9b80ed99689d 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/package.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/streaming/state/package.scala
@@ -23,6 +23,7 @@ import org.apache.spark.TaskContext
import org.apache.spark.rdd.RDD
import org.apache.spark.sql.SQLContext
import org.apache.spark.sql.classic.ClassicConversions.castToImpl
+import org.apache.spark.sql.execution.streaming.operators.stateful.StatefulOperatorStateInfo
import org.apache.spark.sql.internal.SessionState
import org.apache.spark.sql.types.StructType
@@ -109,8 +110,9 @@ package object state {
val cleanedF = dataRDD.sparkContext.clean(storeReadFn)
val wrappedF = (store: ReadStateStore, iter: Iterator[T]) => {
// Clean up the state store.
- TaskContext.get().addTaskCompletionListener[Unit](_ => {
- store.abort()
+ val ctxt = TaskContext.get()
+ ctxt.addTaskCompletionListener[Unit](_ => {
+ StateStoreThreadLocalTracker.clearStore()
})
cleanedF(store, iter)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/SQLAppStatusListener.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/SQLAppStatusListener.scala
index f680860231f01..4dbee24f0fecd 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/SQLAppStatusListener.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/SQLAppStatusListener.scala
@@ -25,7 +25,7 @@ import scala.jdk.CollectionConverters._
import scala.util.control.NonFatal
import org.apache.spark.{JobExecutionStatus, SparkConf}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.CLASS_NAME
import org.apache.spark.internal.config.Status._
import org.apache.spark.scheduler._
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/StreamingQueryHistoryServerPlugin.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/StreamingQueryHistoryServerPlugin.scala
index 76f64dcb64451..1c2abf5179f28 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/StreamingQueryHistoryServerPlugin.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/ui/StreamingQueryHistoryServerPlugin.scala
@@ -19,7 +19,7 @@ package org.apache.spark.sql.execution.ui
import org.apache.spark.SparkConf
import org.apache.spark.scheduler.SparkListener
-import org.apache.spark.sql.execution.streaming.StreamingQueryListenerBus
+import org.apache.spark.sql.execution.streaming.runtime.StreamingQueryListenerBus
import org.apache.spark.sql.streaming.ui.{StreamingQueryStatusListener, StreamingQueryTab}
import org.apache.spark.status.{AppHistoryServerPlugin, ElementTrackingStore}
import org.apache.spark.ui.SparkUI
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactory.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactory.scala
index 9ff056a279466..d59a0e9f4639b 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactory.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactory.scala
@@ -45,6 +45,7 @@ class WindowEvaluatorFactory(
private val factories = windowFrameExpressionFactoryPairs.map(_._2).toArray
private val inMemoryThreshold = conf.windowExecBufferInMemoryThreshold
private val spillThreshold = conf.windowExecBufferSpillThreshold
+ private val spillSizeThreshold = conf.windowExecBufferSpillSizeThreshold
override def eval(
partitionIndex: Int,
@@ -82,7 +83,8 @@ class WindowEvaluatorFactory(
// Manage the current partition.
val buffer: ExternalAppendOnlyUnsafeRowArray =
- new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold)
+ new ExternalAppendOnlyUnsafeRowArray(inMemoryThreshold, spillThreshold,
+ spillSizeThreshold)
var bufferIterator: Iterator[UnsafeRow] = _
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactoryBase.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactoryBase.scala
index 7d13dbbe2a06a..c2dedda832e2e 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactoryBase.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/window/WindowEvaluatorFactoryBase.scala
@@ -22,7 +22,7 @@ import scala.collection.mutable.ArrayBuffer
import org.apache.spark.SparkException
import org.apache.spark.sql.catalyst.InternalRow
-import org.apache.spark.sql.catalyst.expressions.{Add, AggregateWindowFunction, Ascending, Attribute, BoundReference, CurrentRow, DateAdd, DateAddYMInterval, DecimalAddNoOverflowCheck, Descending, Expression, ExtractANSIIntervalDays, FrameLessOffsetWindowFunction, FrameType, IdentityProjection, IntegerLiteral, MutableProjection, NamedExpression, OffsetWindowFunction, PythonFuncExpression, RangeFrame, RowFrame, RowOrdering, SortOrder, SpecifiedWindowFrame, TimeAdd, TimestampAddYMInterval, UnaryMinus, UnboundedFollowing, UnboundedPreceding, UnsafeProjection, WindowExpression}
+import org.apache.spark.sql.catalyst.expressions.{Add, AggregateWindowFunction, Ascending, Attribute, BoundReference, CurrentRow, DateAdd, DateAddYMInterval, DecimalAddNoOverflowCheck, Descending, Expression, ExtractANSIIntervalDays, FrameLessOffsetWindowFunction, FrameType, IdentityProjection, IntegerLiteral, MutableProjection, NamedExpression, OffsetWindowFunction, PythonFuncExpression, RangeFrame, RowFrame, RowOrdering, SortOrder, SpecifiedWindowFrame, TimestampAddInterval, TimestampAddYMInterval, UnaryMinus, UnboundedFollowing, UnboundedPreceding, UnsafeProjection, WindowExpression}
import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateExpression
import org.apache.spark.sql.execution.metric.SQLMetric
import org.apache.spark.sql.internal.SQLConf
@@ -105,11 +105,11 @@ trait WindowEvaluatorFactoryBase {
case (DateType, DayTimeIntervalType(DAY, DAY)) =>
DateAdd(expr, ExtractANSIIntervalDays(boundOffset))
case (TimestampType | TimestampNTZType, CalendarIntervalType) =>
- TimeAdd(expr, boundOffset, Some(timeZone))
+ TimestampAddInterval(expr, boundOffset, Some(timeZone))
case (TimestampType | TimestampNTZType, _: YearMonthIntervalType) =>
TimestampAddYMInterval(expr, boundOffset, Some(timeZone))
case (TimestampType | TimestampNTZType, _: DayTimeIntervalType) =>
- TimeAdd(expr, boundOffset, Some(timeZone))
+ TimestampAddInterval(expr, boundOffset, Some(timeZone))
case (d: DecimalType, _: DecimalType) => DecimalAddNoOverflowCheck(expr, boundOffset, d)
case (a, b) if a == b => Add(expr, boundOffset)
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/internal/BaseSessionStateBuilder.scala b/sql/core/src/main/scala/org/apache/spark/sql/internal/BaseSessionStateBuilder.scala
index 334616a7709e0..ada30cde27cd0 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/internal/BaseSessionStateBuilder.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/internal/BaseSessionStateBuilder.scala
@@ -22,7 +22,7 @@ import org.apache.spark.sql.artifact.ArtifactManager
import org.apache.spark.sql.catalyst.analysis.{Analyzer, EvalSubqueriesForTimeTravel, FunctionRegistry, InvokeProcedures, ReplaceCharWithVarchar, ResolveDataSource, ResolveSessionCatalog, ResolveTranspose, TableFunctionRegistry}
import org.apache.spark.sql.catalyst.analysis.resolver.ResolverExtension
import org.apache.spark.sql.catalyst.catalog.{FunctionExpressionBuilder, SessionCatalog}
-import org.apache.spark.sql.catalyst.expressions.Expression
+import org.apache.spark.sql.catalyst.expressions.{Expression, ExtractSemiStructuredFields}
import org.apache.spark.sql.catalyst.optimizer.Optimizer
import org.apache.spark.sql.catalyst.parser.ParserInterface
import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
@@ -37,7 +37,7 @@ import org.apache.spark.sql.execution.analysis.DetectAmbiguousSelfJoin
import org.apache.spark.sql.execution.command.CommandCheck
import org.apache.spark.sql.execution.datasources._
import org.apache.spark.sql.execution.datasources.v2.{TableCapabilityCheck, V2SessionCatalog}
-import org.apache.spark.sql.execution.streaming.ResolveWriteToStream
+import org.apache.spark.sql.execution.streaming.runtime.ResolveWriteToStream
import org.apache.spark.sql.expressions.UserDefinedAggregateFunction
import org.apache.spark.sql.util.ExecutionListenerManager
@@ -244,6 +244,7 @@ abstract class BaseSessionStateBuilder(
new EvalSubqueriesForTimeTravel +:
new ResolveTranspose(session) +:
new InvokeProcedures(session) +:
+ ExtractSemiStructuredFields +:
customResolutionRules
override val postHocResolutionRules: Seq[Rule[LogicalPlan]] =
@@ -406,7 +407,8 @@ abstract class BaseSessionStateBuilder(
*/
protected def createQueryExecution:
(LogicalPlan, CommandExecutionMode.Value) => QueryExecution =
- (plan, mode) => new QueryExecution(session, plan, mode = mode)
+ (plan, mode) => new QueryExecution(session, plan, mode = mode,
+ shuffleCleanupMode = QueryExecution.determineShuffleCleanupMode(session.sessionState.conf))
/**
* Interface to start and stop streaming queries.
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/internal/SessionStateHelper.scala b/sql/core/src/main/scala/org/apache/spark/sql/internal/SessionStateHelper.scala
new file mode 100644
index 0000000000000..6279f8c123765
--- /dev/null
+++ b/sql/core/src/main/scala/org/apache/spark/sql/internal/SessionStateHelper.scala
@@ -0,0 +1,53 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.internal
+
+import org.apache.hadoop.conf.Configuration
+
+import org.apache.spark.{SparkConf, SparkContext}
+import org.apache.spark.sql.SparkSession
+
+/**
+ * Helper trait for accessing session-state-related configurations and utilities.
+ * It also provides explicit type annotations so that IDEs can build indexes.
+ */
+trait SessionStateHelper {
+ private def sessionState(sparkSession: SparkSession): SessionState = {
+ sparkSession.sessionState
+ }
+
+ private def sparkContext(sparkSession: SparkSession): SparkContext = {
+ sparkSession.sparkContext
+ }
+
+ def getSparkConf(sparkSession: SparkSession): SparkConf = {
+ sparkContext(sparkSession).conf
+ }
+
+ def getSqlConf(sparkSession: SparkSession): SQLConf = {
+ sessionState(sparkSession).conf
+ }
+
+ def getHadoopConf(
+ sparkSession: SparkSession,
+ options: Map[String, String]): Configuration = {
+ sessionState(sparkSession).newHadoopConfWithOptions(options)
+ }
+}
+
+object SessionStateHelper extends SessionStateHelper
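Hypothetical usage from code that only has a SparkSession in hand (the option key below is just an example of a per-relation Hadoop setting):

  val hadoopConf = SessionStateHelper.getHadoopConf(
    sparkSession, Map("fs.s3a.connection.maximum" -> "200"))
  val ansiEnabled = SessionStateHelper.getSqlConf(sparkSession).ansiEnabled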
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/internal/SharedState.scala b/sql/core/src/main/scala/org/apache/spark/sql/internal/SharedState.scala
index 2b1451493398f..af1f38caab686 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/internal/SharedState.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/internal/SharedState.scala
@@ -29,12 +29,12 @@ import org.apache.hadoop.conf.Configuration
import org.apache.hadoop.fs.{FsUrlStreamHandlerFactory, Path}
import org.apache.spark.{SparkConf, SparkContext}
-import org.apache.spark.internal.{Logging, MDC}
+import org.apache.spark.internal.Logging
import org.apache.spark.internal.LogKeys.{CONFIG, CONFIG2, PATH, VALUE}
import org.apache.spark.sql.catalyst.catalog._
import org.apache.spark.sql.errors.QueryExecutionErrors
import org.apache.spark.sql.execution.CacheManager
-import org.apache.spark.sql.execution.streaming.StreamExecution
+import org.apache.spark.sql.execution.streaming.runtime.StreamExecution
import org.apache.spark.sql.execution.ui.{SQLAppStatusListener, SQLAppStatusStore, SQLTab, StreamingQueryStatusStore}
import org.apache.spark.sql.internal.StaticSQLConf._
import org.apache.spark.sql.streaming.ui.{StreamingQueryStatusListener, StreamingQueryTab}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/DatabricksDialect.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/DatabricksDialect.scala
index f4fc670470328..9124c1b889098 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/DatabricksDialect.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/DatabricksDialect.scala
@@ -59,7 +59,12 @@ private case class DatabricksDialect() extends JdbcDialect with NoLegacyJDBCErro
}
override def quoteIdentifier(colName: String): String = {
- s"`$colName`"
+ // Per Databricks documentation:
+ // https://docs.databricks.com/aws/en/sql/language-manual/sql-ref-identifiers
+ //
+ // "Any character from the Unicode character set. Use ` to escape ` itself."
+ val escapedColName = colName.replace("`", "``")
+ s"`$escapedColName`"
}
override def supportsLimit: Boolean = true
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/H2Dialect.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/H2Dialect.scala
index b5ee88aebd7d6..966c5d14bc662 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/H2Dialect.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/H2Dialect.scala
@@ -25,8 +25,6 @@ import java.util.concurrent.ConcurrentHashMap
import scala.jdk.CollectionConverters._
import scala.util.control.NonFatal
-import org.apache.commons.lang3.StringUtils
-
import org.apache.spark.{SparkThrowable, SparkUnsupportedOperationException}
import org.apache.spark.sql.catalyst.analysis.{IndexAlreadyExistsException, NoSuchIndexException, NoSuchNamespaceException, NoSuchTableException, TableAlreadyExistsException}
import org.apache.spark.sql.connector.catalog.Identifier
@@ -35,6 +33,7 @@ import org.apache.spark.sql.connector.catalog.index.TableIndex
import org.apache.spark.sql.connector.expressions.{Expression, FieldReference, NamedReference}
import org.apache.spark.sql.execution.datasources.jdbc.{JDBCOptions, JdbcUtils}
import org.apache.spark.sql.types.{BooleanType, ByteType, DataType, DecimalType, MetadataBuilder, ShortType, StringType, TimestampType}
+import org.apache.spark.util.SparkStringUtils
private[sql] case class H2Dialect() extends JdbcDialect with NoLegacyJDBCError {
override def canHandle(url: String): Boolean =
@@ -181,7 +180,7 @@ private[sql] case class H2Dialect() extends JdbcDialect with NoLegacyJDBCError {
indexMap += (indexName -> newIndex)
} else {
val properties = new util.Properties()
- if (StringUtils.isNotEmpty(indexComment)) properties.put("COMMENT", indexComment)
+ if (SparkStringUtils.isNotEmpty(indexComment)) properties.put("COMMENT", indexComment)
val index = new TableIndex(indexName, indexType, Array(FieldReference(colName)),
new util.HashMap[NamedReference, util.Properties](), properties)
indexMap += (indexName -> index)
@@ -307,4 +306,6 @@ private[sql] case class H2Dialect() extends JdbcDialect with NoLegacyJDBCError {
override def supportsLimit: Boolean = true
override def supportsOffset: Boolean = true
+
+ override def supportsJoin: Boolean = true
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcDialects.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcDialects.scala
index da0df734bbeca..ce4c347cad349 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcDialects.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcDialects.scala
@@ -26,8 +26,6 @@ import java.util.concurrent.TimeUnit
import scala.collection.mutable.ArrayBuilder
import scala.util.control.NonFatal
-import org.apache.commons.lang3.StringUtils
-
import org.apache.spark.{SparkRuntimeException, SparkThrowable, SparkUnsupportedOperationException}
import org.apache.spark.annotation.{DeveloperApi, Since}
import org.apache.spark.internal.Logging
@@ -244,7 +242,9 @@ abstract class JdbcDialect extends Serializable with Logging {
* name is a reserved keyword, or in case it contains characters that require quotes (e.g. space).
*/
def quoteIdentifier(colName: String): String = {
- s""""$colName""""
+ // Per the ANSI standard, a double quote inside an identifier is escaped by doubling it.
+ val escapedColName = colName.replace("\"", "\"\"")
+ s""""$escapedColName""""
}
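The effect of the ANSI-style escaping above, shown with plain string manipulation (no Spark types involved):

  def quote(colName: String): String = {
    val escaped = colName.replace("\"", "\"\"")
    s""""$escaped""""
  }
  assert(quote("order") == "\"order\"")  // reserved keyword, simply quoted
  assert(quote("a\"b") == "\"a\"\"b\"")  // embedded double quote is doubled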
/**
@@ -352,7 +352,7 @@ abstract class JdbcDialect extends Serializable with Logging {
*/
@Since("2.3.0")
protected[jdbc] def escapeSql(value: String): String =
- if (value == null) null else StringUtils.replace(value, "'", "''")
+ if (value == null) null else value.replace("'", "''")
/**
* Converts value to SQL expression.
@@ -853,6 +853,11 @@ abstract class JdbcDialect extends Serializable with Logging {
def supportsHint: Boolean = false
+ /**
+ * Returns true if dialect supports JOIN operator.
+ */
+ def supportsJoin: Boolean = false
+
/**
* Return the DB-specific quoted and fully qualified table name
*/
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcSQLQueryBuilder.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcSQLQueryBuilder.scala
index 95be14f816a76..93af5890711c6 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcSQLQueryBuilder.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/JdbcSQLQueryBuilder.scala
@@ -91,6 +91,20 @@ class JdbcSQLQueryBuilder(dialect: JdbcDialect, options: JDBCOptions) {
this
}
+ /**
+ * Constructs the list of selected columns, attaching an alias to every column that has one.
+ * `columns` and `aliases` are expected to have the same length.
+ */
+ def withAliasedColumns(
+ columns: Array[String],
+ aliases: Array[Option[String]]): JdbcSQLQueryBuilder = {
+ if (columns.nonEmpty) {
+ assert(columns.length == aliases.length,
+ "Number of columns does not match the number of provided aliases")
+
+ columnList = columns.zip(aliases).map {
+ case (column, alias) => if (alias.isDefined) s"$column AS ${alias.get}" else column
+ }.mkString(",")
+ }
+ this
+ }
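A quick illustration of the column list produced above, using hypothetical column names and mirroring the same zip/map logic:

  val columns = Array("\"DEPT\".\"ID\"", "\"EMP\".\"ID\"")
  val aliases = Array(Option("DEPT_ID"), Option.empty[String])
  val columnList = columns.zip(aliases).map {
    case (column, alias) => if (alias.isDefined) s"$column AS ${alias.get}" else column
  }.mkString(",")
  // columnList == "\"DEPT\".\"ID\" AS DEPT_ID,\"EMP\".\"ID\""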
+
/**
* Constructs the WHERE clause that following dialect's SQL syntax.
*/
@@ -164,6 +178,38 @@ class JdbcSQLQueryBuilder(dialect: JdbcDialect, options: JDBCOptions) {
this
}
+ /**
+ * Represents JOIN subquery in case Join has been pushed down. This value should be used
+ * instead of options.tableOrQuery if join has been pushed down.
+ */
+ private var joinQuery: Option[String] = None
+
+ /**
+ * Builds the pushed-down join as a nested subquery over the left and right child queries.
+ * The resulting subquery replaces options.tableOrQuery when the final SQL is built.
+ */
+ def withJoin(
+ left: JdbcSQLQueryBuilder,
+ right: JdbcSQLQueryBuilder,
+ leftSideQualifier: String,
+ rightSideQualifier: String,
+ columns: Array[String],
+ joinType: String,
+ joinCondition: String): JdbcSQLQueryBuilder = {
+ columnList = columns.mkString(",")
+ joinQuery = Some(
+ s"""(
+ |SELECT ${columns.mkString(",")} FROM
+ |(${left.build()}) $leftSideQualifier
+ |$joinType
+ |(${right.build()}) $rightSideQualifier
+ |ON $joinCondition
+ |) ${JoinPushdownAliasGenerator.getSubqueryQualifier}""".stripMargin
+ )
+
+ this
+ }
+
+ // If the join has been pushed down, reuse the join query as a subquery. Otherwise, fall
+ // back to the table or query provided in options.
+ protected final def tableOrQuery: String = joinQuery.getOrElse(options.tableOrQuery)
+
/**
* Build the final SQL query that following dialect's SQL syntax.
*/
@@ -174,7 +220,15 @@ class JdbcSQLQueryBuilder(dialect: JdbcDialect, options: JDBCOptions) {
val offsetClause = dialect.getOffsetClause(offset)
options.prepareQuery +
- s"SELECT $hintClause$columnList FROM ${options.tableOrQuery} $tableSampleClause" +
+ s"SELECT $hintClause$columnList FROM $tableOrQuery $tableSampleClause" +
s" $whereClause $groupByClause $orderByClause $limitClause $offsetClause"
}
}
+
+object JoinPushdownAliasGenerator {
+ private val subQueryId = new java.util.concurrent.atomic.AtomicLong()
+
+ def getSubqueryQualifier: String = {
+ "join_subquery_" + subQueryId.getAndIncrement()
+ }
+}
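For reference, a rough shape of the subquery string withJoin produces, with entirely hypothetical table names, qualifiers, and join condition (the real values come from the join pushdown rule):

  val columns = Array("t0.NAME", "t1.ID")
  val joinQuery =
    s"""(
       |SELECT ${columns.mkString(",")} FROM
       |(SELECT * FROM EMP) t0
       |INNER JOIN
       |(SELECT * FROM DEPT) t1
       |ON t0.DEPT_ID = t1.ID
       |) join_subquery_0""".stripMargin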
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MsSqlServerDialect.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MsSqlServerDialect.scala
index 3f06ea1a2fbfc..2954795836877 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MsSqlServerDialect.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MsSqlServerDialect.scala
@@ -265,7 +265,7 @@ private case class MsSqlServerDialect() extends JdbcDialect with NoLegacyJDBCErr
val limitClause = dialect.getLimitClause(limit)
options.prepareQuery +
- s"SELECT $limitClause $columnList FROM ${options.tableOrQuery}" +
+ s"SELECT $limitClause $columnList FROM $tableOrQuery" +
s" $whereClause $groupByClause $orderByClause"
}
}
@@ -286,6 +286,8 @@ private case class MsSqlServerDialect() extends JdbcDialect with NoLegacyJDBCErr
}
override def supportsLimit: Boolean = true
+
+ override def supportsJoin: Boolean = true
}
private object MsSqlServerDialect {
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MySQLDialect.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MySQLDialect.scala
index 19377057844e5..41452ca45057c 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MySQLDialect.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/MySQLDialect.scala
@@ -196,7 +196,13 @@ private case class MySQLDialect() extends JdbcDialect with SQLConfHelper with No
}
override def quoteIdentifier(colName: String): String = {
- s"`$colName`"
+ // Per MySQL documentation: https://dev.mysql.com/doc/refman/8.4/en/identifiers.html
+ //
+ // Identifier quote characters can be included within an identifier if you quote the
+ // identifier. If the character to be included within the identifier is the same as
+ // that used to quote the identifier itself, then you need to double the character.
+ val escapedColName = colName.replace("`", "``")
+ s"`$escapedColName`"
}
override def schemasExists(conn: Connection, options: JDBCOptions, schema: String): Boolean = {
@@ -424,7 +430,7 @@ private case class MySQLDialect() extends JdbcDialect with SQLConfHelper with No
}
options.prepareQuery +
- s"SELECT $hintClause$columnList FROM ${options.tableOrQuery} $tableSampleClause" +
+ s"SELECT $hintClause$columnList FROM $tableOrQuery $tableSampleClause" +
s" $whereClause $groupByClause $orderByClause $limitOrOffsetStmt"
}
}
@@ -437,4 +443,6 @@ private case class MySQLDialect() extends JdbcDialect with SQLConfHelper with No
override def supportsOffset: Boolean = true
override def supportsHint: Boolean = true
+
+ override def supportsJoin: Boolean = true
}
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/OracleDialect.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/OracleDialect.scala
index a9f6a727a7241..81031b1ec13d4 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/OracleDialect.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/OracleDialect.scala
@@ -24,7 +24,7 @@ import scala.util.control.NonFatal
import org.apache.spark.{SparkThrowable, SparkUnsupportedOperationException}
import org.apache.spark.sql.catalyst.SQLConfHelper
-import org.apache.spark.sql.connector.expressions.{Expression, Literal}
+import org.apache.spark.sql.connector.expressions.{Expression, Extract, Literal}
import org.apache.spark.sql.errors.QueryCompilationErrors
import org.apache.spark.sql.execution.datasources.jdbc.JDBCOptions
import org.apache.spark.sql.jdbc.OracleDialect._
@@ -44,7 +44,7 @@ private case class OracleDialect() extends JdbcDialect with SQLConfHelper with N
// scalastyle:on line.size.limit
private val supportedAggregateFunctions =
Set("MAX", "MIN", "SUM", "COUNT", "AVG") ++ distinctUnsupportedAggregateFunctions
- private val supportedFunctions = supportedAggregateFunctions
+ private val supportedFunctions = supportedAggregateFunctions ++ Set("TRUNC")
override def isSupportedFunction(funcName: String): Boolean =
supportedFunctions.contains(funcName)
@@ -56,6 +56,30 @@ private case class OracleDialect() extends JdbcDialect with SQLConfHelper with N
class OracleSQLBuilder extends JDBCSQLBuilder {
+ override def visitExtract(extract: Extract): String = {
+ val field = extract.field
+ field match {
+ // YEAR, MONTH, DAY, HOUR, MINUTE are identical on Oracle and Spark for
+ // both datetime and interval types.
+ case "YEAR" | "MONTH" | "DAY" | "HOUR" | "MINUTE" =>
+ super.visitExtract(field, build(extract.source()))
+ // Oracle does not support the following date fields: DAY_OF_YEAR, WEEK, QUARTER,
+ // DAY_OF_WEEK, or YEAR_OF_WEEK.
+ // We can't push down SECOND due to the difference in result types between Spark and
+ // Oracle. Spark returns decimal(8, 6), but Oracle returns integer.
+ case _ =>
+ visitUnexpectedExpr(extract)
+ }
+ }
+
+ override def visitSQLFunction(funcName: String, inputs: Array[String]): String = {
+ funcName match {
+ case "TRUNC" =>
+ s"TRUNC(${inputs(0)}, 'IW')"
+ case _ => super.visitSQLFunction(funcName, inputs)
+ }
+ }
+
override def visitAggregateFunction(
funcName: String, isDistinct: Boolean, inputs: Array[String]): String =
if (isDistinct && distinctUnsupportedAggregateFunctions.contains(funcName)) {
@@ -233,7 +257,7 @@ private case class OracleDialect() extends JdbcDialect with SQLConfHelper with N
extends JdbcSQLQueryBuilder(dialect, options) {
override def build(): String = {
- val selectStmt = s"SELECT $hintClause$columnList FROM ${options.tableOrQuery}" +
+ val selectStmt = s"SELECT $hintClause$columnList FROM $tableOrQuery" +
s" $tableSampleClause $whereClause $groupByClause $orderByClause"
val finalSelectStmt = if (limit > 0) {
if (offset > 0) {
@@ -268,6 +292,8 @@ private case class OracleDialect() extends JdbcDialect with SQLConfHelper with N
override def supportsHint: Boolean = true
+ override def supportsJoin: Boolean = true
+
override def classifyException(
e: Throwable,
condition: String,
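
A minimal sketch of the pushdown guard used in the Oracle builder above: translate EXTRACT only for fields whose semantics match on both engines, and decline the rest so Spark evaluates them itself (SECOND, for example, differs: Spark yields decimal(8, 6) while Oracle yields an integer). The types below are simplified stand-ins, not the Spark connector API:

object ExtractPushdown {
  private val compatibleFields = Set("YEAR", "MONTH", "DAY", "HOUR", "MINUTE")

  // Some(sql) when the field can be pushed down to Oracle, None when Spark must evaluate it.
  def compile(field: String, sourceSql: String): Option[String] =
    if (compatibleFields.contains(field)) Some(s"EXTRACT($field FROM $sourceSql)") else None
}

// compile("HOUR", "ORDER_TS")   => Some(EXTRACT(HOUR FROM ORDER_TS))
// compile("SECOND", "ORDER_TS") => None
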
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/PostgresDialect.scala b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/PostgresDialect.scala
index b5a0dd95e60c4..d7d730ed0cc3a 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/jdbc/PostgresDialect.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/jdbc/PostgresDialect.scala
@@ -27,7 +27,6 @@ import scala.util.control.NonFatal
import org.apache.spark.SparkThrowable
import org.apache.spark.internal.LogKeys.COLUMN_NAME
-import org.apache.spark.internal.MDC
import org.apache.spark.sql.catalyst.SQLConfHelper
import org.apache.spark.sql.catalyst.analysis.{IndexAlreadyExistsException, NonEmptyNamespaceException, NoSuchIndexException}
import org.apache.spark.sql.connector.catalog.Identifier
@@ -363,6 +362,8 @@ private case class PostgresDialect()
override def supportsTableSample: Boolean = true
+ override def supportsJoin: Boolean = true
+
override def getTableSample(sample: TableSampleInfo): String = {
// hard-coded to BERNOULLI for now because Spark doesn't have a way to specify sample
// method name
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingExecutionNode.scala b/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingExecutionNode.scala
index fa8aaf6d81c2b..efc44f84cd2c2 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingExecutionNode.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingExecutionNode.scala
@@ -1174,7 +1174,7 @@ class ForStatementExec(
val defaultExpression = DefaultValueExpression(
Literal(null, queryColumnNameToDataType(varName)), "null")
val declareVariable = CreateVariable(
- UnresolvedIdentifier(Seq(varName)),
+ Seq(UnresolvedIdentifier(Seq(varName))),
defaultExpression,
replace = false
)
@@ -1187,7 +1187,7 @@ class ForStatementExec(
OneRowRelation()
)
val setIdentifierToCurrentRow =
- SetVariable(Seq(UnresolvedAttribute(varName)), projectNamedStruct)
+ SetVariable(Seq(UnresolvedAttribute.quoted(varName)), projectNamedStruct)
new SingleStatementExec(
setIdentifierToCurrentRow,
Origin(),
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingInterpreter.scala b/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingInterpreter.scala
index 9ab45c4003f8c..e0e11183d3213 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingInterpreter.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingInterpreter.scala
@@ -122,12 +122,21 @@ case class SqlScriptingInterpreter(session: SparkSession) {
// Get NOT FOUND handler.
notFoundHandler = if (handler.exceptionHandlerTriggers.notFound) {
- Some(handlerExec)
+ if (notFoundHandler.isDefined) {
+ throw SqlScriptingErrors.duplicateHandlerForSameCondition(CurrentOrigin.get, "NOT FOUND")
+ } else {
+ Some(handlerExec)
+ }
} else None
// Get SQLEXCEPTION handler.
sqlExceptionHandler = if (handler.exceptionHandlerTriggers.sqlException) {
- Some(handlerExec)
+ if (sqlExceptionHandler.isDefined) {
+ throw SqlScriptingErrors
+ .duplicateHandlerForSameCondition(CurrentOrigin.get, "SQLEXCEPTION")
+ } else {
+ Some(handlerExec)
+ }
} else None
})
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingLocalVariableManager.scala b/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingLocalVariableManager.scala
index f875f2154a925..fb3560ddb9f38 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingLocalVariableManager.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/scripting/SqlScriptingLocalVariableManager.scala
@@ -28,6 +28,9 @@ import org.apache.spark.sql.errors.QueryCompilationErrors.unresolvedVariableErro
class SqlScriptingLocalVariableManager(context: SqlScriptingExecutionContext)
extends VariableManager with DataTypeErrorsBase {
+ override def getVariableNameForError(variableName: String): String =
+ toSQLId(Seq(context.currentScope.label, variableName))
+
override def create(
nameParts: Seq[String],
varDef: VariableDefinition,
@@ -42,7 +45,7 @@ class SqlScriptingLocalVariableManager(context: SqlScriptingExecutionContext)
throw new AnalysisException(
errorClass = "VARIABLE_ALREADY_EXISTS",
messageParameters = Map(
- "variableName" -> toSQLId(Seq(context.currentScope.label, name))))
+ "variableName" -> getVariableNameForError(name)))
}
context.currentScope.variables.put(name, varDef)
}
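
A minimal sketch of the error-name formatting introduced above, where a local variable is reported as `scopeLabel`.`variableName`; the quoting helper is a simplified stand-in for toSQLId, not the Spark implementation:

object VariableErrorNames {
  // Quote each part with backticks, doubling any embedded backtick, then join with a dot.
  private def quotePart(part: String): String = "`" + part.replace("`", "``") + "`"

  def variableNameForError(scopeLabel: String, variableName: String): String =
    Seq(scopeLabel, variableName).map(quotePart).mkString(".")
}

// variableNameForError("lbl", "cnt") => `lbl`.`cnt`
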
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/streaming/TestGroupState.scala b/sql/core/src/main/scala/org/apache/spark/sql/streaming/TestGroupState.scala
index b92e361ef805b..17fb402457b74 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/streaming/TestGroupState.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/streaming/TestGroupState.scala
@@ -19,8 +19,8 @@ package org.apache.spark.sql.streaming
import org.apache.spark.annotation.Evolving
import org.apache.spark.api.java.Optional
-import org.apache.spark.sql.execution.streaming.GroupStateImpl
-import org.apache.spark.sql.execution.streaming.GroupStateImpl._
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl
+import org.apache.spark.sql.execution.streaming.operators.stateful.flatmapgroupswithstate.GroupStateImpl._
/**
* :: Experimental ::
diff --git a/sql/core/src/test/java/test/org/apache/spark/sql/JavaBeanDeserializationSuite.java b/sql/core/src/test/java/test/org/apache/spark/sql/JavaBeanDeserializationSuite.java
index a83041dc522c6..79a7d2b71cc43 100644
--- a/sql/core/src/test/java/test/org/apache/spark/sql/JavaBeanDeserializationSuite.java
+++ b/sql/core/src/test/java/test/org/apache/spark/sql/JavaBeanDeserializationSuite.java
@@ -24,8 +24,6 @@
import java.time.LocalDate;
import java.util.*;
-import org.apache.commons.lang3.builder.ToStringBuilder;
-import org.apache.commons.lang3.builder.ToStringStyle;
import org.junit.jupiter.api.*;
import org.apache.spark.api.java.function.MapFunction;
@@ -493,17 +491,10 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("shortField", shortField)
- .append("intField", intField)
- .append("longField", longField)
- .append("floatField", floatField)
- .append("doubleField", doubleField)
- .append("stringField", stringField)
- .append("booleanField", booleanField)
- .append("timestampField", timestampField)
- .append("nullIntField", nullIntField)
- .toString();
+ return "RecordSpark22000[shortField=" + shortField + ",intField=" + intField +
+ ",longField=" + longField + ",floatField=" + floatField + ",doubleField=" + doubleField +
+ ",stringField=" + stringField + ",booleanField=" + booleanField +
+ ",timestampField=" + timestampField + ",nullIntField=" + nullIntField + "]";
}
}
@@ -680,10 +671,8 @@ public int hashCode() {
@Override
public String toString() {
- return new ToStringBuilder(this, ToStringStyle.SHORT_PREFIX_STYLE)
- .append("localDateField", localDateField)
- .append("instantField", instantField)
- .toString();
+ return "LocalDateInstantRecord[localDateField=" + localDateField +
+ ",instantField=" + instantField + "]";
}
}
diff --git a/sql/core/src/test/java/test/org/apache/spark/sql/JavaColumnExpressionSuite.java b/sql/core/src/test/java/test/org/apache/spark/sql/JavaColumnExpressionSuite.java
index 9988d04220f0f..1a94867668aec 100644
--- a/sql/core/src/test/java/test/org/apache/spark/sql/JavaColumnExpressionSuite.java
+++ b/sql/core/src/test/java/test/org/apache/spark/sql/JavaColumnExpressionSuite.java
@@ -19,8 +19,6 @@
import java.util.*;
-import com.google.common.collect.Maps;
-
import org.junit.jupiter.api.AfterEach;
import org.junit.jupiter.api.Assertions;
import org.junit.jupiter.api.BeforeEach;
@@ -90,6 +88,6 @@ public void isInCollectionCheckExceptionMessage() {
messageParameters.put("functionName", "`in`");
messageParameters.put("dataType", "[\"INT\", \"ARRAY\"]");
messageParameters.put("sqlExpr", "\"(a IN (b))\"");
- Assertions.assertTrue(Maps.difference(e.getMessageParameters(), messageParameters).areEqual());
+ Assertions.assertTrue(e.getMessageParameters().equals(messageParameters));
}
}
diff --git a/sql/core/src/test/java/test/org/apache/spark/sql/JavaDataFrameSuite.java b/sql/core/src/test/java/test/org/apache/spark/sql/JavaDataFrameSuite.java
index 27137e53934d2..a780c057e9038 100644
--- a/sql/core/src/test/java/test/org/apache/spark/sql/JavaDataFrameSuite.java
+++ b/sql/core/src/test/java/test/org/apache/spark/sql/JavaDataFrameSuite.java
@@ -27,7 +27,6 @@
import scala.collection.Seq;
import scala.jdk.javaapi.CollectionConverters;
-import com.google.common.collect.ImmutableMap;
import com.google.common.primitives.Ints;
import org.junit.jupiter.api.*;
@@ -133,7 +132,7 @@ public void testShow() {
public static class Bean implements Serializable {
private double a = 0.0;
private Integer[] b = { 0, 1 };
- private Map<String, int[]> c = ImmutableMap.of("hello", new int[] { 1, 2 });
+ private Map<String, int[]> c = Map.of("hello", new int[] { 1, 2 });
private List<String> d = Arrays.asList("floppy", "disk");
private BigInteger e = new BigInteger("1234567");
private NestedBean f = new NestedBean();
@@ -312,7 +311,7 @@ public void testCovariance() {
@Test
public void testSampleBy() {
Dataset<Row> df = spark.range(0, 100, 1, 2).select(col("id").mod(3).as("key"));
- Dataset<Row> sampled = df.stat().sampleBy("key", ImmutableMap.of(0, 0.1, 1, 0.2), 0L);
+ Dataset<Row> sampled = df.stat().sampleBy("key", Map.of(0, 0.1, 1, 0.2), 0L);
List<Row> actual = sampled.groupBy("key").count().orderBy("key").collectAsList();
Assertions.assertEquals(0, actual.get(0).getLong(0));
Assertions.assertTrue(0 <= actual.get(0).getLong(1) && actual.get(0).getLong(1) <= 8);
@@ -338,7 +337,7 @@ public void testwithColumns() {
@Test
public void testSampleByColumn() {
Dataset<Row> df = spark.range(0, 100, 1, 2).select(col("id").mod(3).as("key"));
- Dataset<Row> sampled = df.stat().sampleBy(col("key"), ImmutableMap.of(0, 0.1, 1, 0.2), 0L);
+ Dataset<Row> sampled = df.stat().sampleBy(col("key"), Map.of(0, 0.1, 1, 0.2), 0L);
List<Row> actual = sampled.groupBy("key").count().orderBy("key").collectAsList();
Assertions.assertEquals(0, actual.get(0).getLong(0));
Assertions.assertTrue(0 <= actual.get(0).getLong(1) && actual.get(0).getLong(1) <= 8);
diff --git a/sql/core/src/test/java/test/org/apache/spark/sql/JavaDatasetSuite.java b/sql/core/src/test/java/test/org/apache/spark/sql/JavaDatasetSuite.java
index 692b5c0ebc3a9..33afafbf25601 100644
--- a/sql/core/src/test/java/test/org/apache/spark/sql/JavaDatasetSuite.java
+++ b/sql/core/src/test/java/test/org/apache/spark/sql/JavaDatasetSuite.java
@@ -33,7 +33,6 @@
import scala.Tuple4;
import scala.Tuple5;
-import com.google.common.base.Objects;
import org.junit.jupiter.api.AfterEach;
import org.junit.jupiter.api.Assertions;
import org.junit.jupiter.api.BeforeEach;
@@ -812,6 +811,26 @@ public void testLocalTimeEncoder() {
Assertions.assertEquals(data, ds.collectAsList());
}
+ @Test
+ public void testLocalTimeFilter() {
+ Encoder<LocalTime> encoder = Encoders.LOCALTIME();
+ List<LocalTime> data = Arrays.asList(
+ LocalTime.of(9, 30, 45),
+ LocalTime.of(14, 10, 10),
+ LocalTime.of(22, 10, 10)
+ );
+ Dataset<LocalTime> ds = spark.createDataset(data, encoder);
+
+ Dataset<LocalTime> filtered = ds.filter(
+ (FilterFunction<LocalTime>) time -> time.isAfter(LocalTime.of(12, 0, 0))
+ );
+ List<LocalTime> expectedFiltered = Arrays.asList(
+ LocalTime.of(14, 10, 10),
+ LocalTime.of(22, 10, 10)
+ );
+ Assertions.assertEquals(expectedFiltered, filtered.collectAsList());
+ }
+
public static class KryoSerializable {
String value;
@@ -1192,12 +1211,12 @@ public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
SmallBean smallBean = (SmallBean) o;
- return b == smallBean.b && com.google.common.base.Objects.equal(a, smallBean.a);
+ return b == smallBean.b && Objects.equals(a, smallBean.a);
}
@Override
public int hashCode() {
- return Objects.hashCode(a, b);
+ return Objects.hash(a, b);
}
}
@@ -1217,7 +1236,7 @@ public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
NestedSmallBean that = (NestedSmallBean) o;
- return Objects.equal(f, that.f);
+ return Objects.equals(f, that.f);
}
@Override
@@ -1259,13 +1278,13 @@ public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
NestedSmallBeanWithNonNullField that = (NestedSmallBeanWithNonNullField) o;
- return Objects.equal(nullable_f, that.nullable_f) &&
- Objects.equal(nonNull_f, that.nonNull_f) && Objects.equal(childMap, that.childMap);
+ return Objects.equals(nullable_f, that.nullable_f) &&
+ Objects.equals(nonNull_f, that.nonNull_f) && Objects.equals(childMap, that.childMap);
}
@Override
public int hashCode() {
- return Objects.hashCode(nullable_f, nonNull_f, childMap);
+ return Objects.hash(nullable_f, nonNull_f, childMap);
}
}
@@ -1286,7 +1305,7 @@ public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
NestedSmallBean2 that = (NestedSmallBean2) o;
- return Objects.equal(f, that.f);
+ return Objects.equals(f, that.f);
}
@Override
@@ -1828,7 +1847,7 @@ public String toString() {
}
public int hashCode() {
- return Objects.hashCode(enumField, regularField);
+ return Objects.hash(enumField, regularField);
}
public boolean equals(Object other) {
@@ -2085,7 +2104,7 @@ public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
BeanWithSet that = (BeanWithSet) o;
- return Objects.equal(fields, that.fields);
+ return Objects.equals(fields, that.fields);
}
@Override
@@ -2128,14 +2147,14 @@ public boolean equals(Object o) {
if (this == o) return true;
if (o == null || getClass() != o.getClass()) return false;
SpecificListsBean that = (SpecificListsBean) o;
- return Objects.equal(arrayList, that.arrayList) &&
- Objects.equal(linkedList, that.linkedList) &&
- Objects.equal(list, that.list);
+ return Objects.equals(arrayList, that.arrayList) &&
+ Objects.equals(linkedList, that.linkedList) &&
+ Objects.equals(list, that.list);
}
@Override
public int hashCode() {
- return Objects.hashCode(arrayList, linkedList, list);
+ return Objects.hash(arrayList, linkedList, list);
}
}
}
diff --git a/sql/core/src/test/java/test/org/apache/spark/sql/JavaUDFSuite.java b/sql/core/src/test/java/test/org/apache/spark/sql/JavaUDFSuite.java
index c1f48a922b727..7328249955147 100644
--- a/sql/core/src/test/java/test/org/apache/spark/sql/JavaUDFSuite.java
+++ b/sql/core/src/test/java/test/org/apache/spark/sql/JavaUDFSuite.java
@@ -19,6 +19,7 @@
import java.io.Serializable;
import java.time.LocalDate;
+import java.time.LocalTime;
import java.util.List;
import org.apache.spark.sql.catalyst.FunctionIdentifier;
@@ -34,6 +35,7 @@
import org.apache.spark.sql.classic.SparkSession;
import org.apache.spark.sql.api.java.UDF2;
import org.apache.spark.sql.types.DataTypes;
+import org.apache.spark.sql.types.TimeType;
// The test suite itself is Serializable so that anonymous Function implementations can be
// serialized, as an alternative to converting these anonymous classes to static inner classes;
@@ -136,6 +138,15 @@ public void udf7Test() {
}
}
+ @Test
+ public void udf8Test() {
+ spark.udf().register(
+ "plusTwoHours",
+ (java.time.LocalTime lt) -> lt.plusHours(2), new TimeType(6));
+ Row result = spark.sql("SELECT plusTwoHours(TIME '09:10:10')").head();
+ Assertions.assertEquals(LocalTime.of(11, 10, 10), result.get(0));
+ }
+
@Test
public void sourceTest() {
spark.udf().register("stringLengthTest", (String str) -> str.length(), DataTypes.IntegerType);
diff --git a/sql/core/src/test/resources/log4j2.properties b/sql/core/src/test/resources/log4j2.properties
index 9b0e2af355fd8..0951114470faa 100644
--- a/sql/core/src/test/resources/log4j2.properties
+++ b/sql/core/src/test/resources/log4j2.properties
@@ -42,7 +42,6 @@ appender.file.fileName = target/unit-tests.log
appender.file.layout.type = PatternLayout
appender.file.layout.pattern = %d{HH:mm:ss.SSS} %t %p %c{1}: %m%n%ex
-# Set the logger level of File Appender to WARN
appender.file.filter.threshold.type = ThresholdFilter
appender.file.filter.threshold.level = info
diff --git a/sql/core/src/test/resources/sql-functions/sql-expression-schema.md b/sql/core/src/test/resources/sql-functions/sql-expression-schema.md
index da7b8f3f7709d..6e6d520efbac3 100644
--- a/sql/core/src/test/resources/sql-functions/sql-expression-schema.md
+++ b/sql/core/src/test/resources/sql-functions/sql-expression-schema.md
@@ -10,6 +10,7 @@
| org.apache.spark.sql.catalyst.expressions.AesDecrypt | aes_decrypt | SELECT aes_decrypt(unhex('83F16B2AA704794132802D248E6BFD4E380078182D1544813898AC97E709B28A94'), '0000111122223333') | struct |
| org.apache.spark.sql.catalyst.expressions.AesEncrypt | aes_encrypt | SELECT hex(aes_encrypt('Spark', '0000111122223333')) | struct |
| org.apache.spark.sql.catalyst.expressions.And | and | SELECT true and true | struct<(true AND true):boolean> |
+| org.apache.spark.sql.catalyst.expressions.ApproxTopKEstimate | approx_top_k_estimate | SELECT approx_top_k_estimate(approx_top_k_accumulate(expr)) FROM VALUES (0), (0), (1), (1), (2), (3), (4), (4) AS tab(expr) | struct>> |
| org.apache.spark.sql.catalyst.expressions.ArrayAggregate | aggregate | SELECT aggregate(array(1, 2, 3), 0, (acc, x) -> acc + x) | struct |
| org.apache.spark.sql.catalyst.expressions.ArrayAggregate | reduce | SELECT reduce(array(1, 2, 3), 0, (acc, x) -> acc + x) | struct |
| org.apache.spark.sql.catalyst.expressions.ArrayAppend | array_append | SELECT array_append(array('b', 'd', 'c', 'a'), 'd') | struct> |
@@ -73,6 +74,7 @@
| org.apache.spark.sql.catalyst.expressions.Cast | int | N/A | N/A |
| org.apache.spark.sql.catalyst.expressions.Cast | smallint | N/A | N/A |
| org.apache.spark.sql.catalyst.expressions.Cast | string | N/A | N/A |
+| org.apache.spark.sql.catalyst.expressions.Cast | time | N/A | N/A |
| org.apache.spark.sql.catalyst.expressions.Cast | timestamp | N/A | N/A |
| org.apache.spark.sql.catalyst.expressions.Cast | tinyint | N/A | N/A |
| org.apache.spark.sql.catalyst.expressions.Cbrt | cbrt | SELECT cbrt(27.0) | struct |
@@ -207,7 +209,7 @@
| org.apache.spark.sql.catalyst.expressions.MakeDate | make_date | SELECT make_date(2013, 7, 15) | struct |
| org.apache.spark.sql.catalyst.expressions.MakeInterval | make_interval | SELECT make_interval(100, 11, 1, 1, 12, 30, 01.001001) | struct |
| org.apache.spark.sql.catalyst.expressions.MakeTime | make_time | SELECT make_time(6, 30, 45.887) | struct |
-| org.apache.spark.sql.catalyst.expressions.MakeTimestamp | make_timestamp | SELECT make_timestamp(2014, 12, 28, 6, 30, 45.887) | struct |
+| org.apache.spark.sql.catalyst.expressions.MakeTimestampExpressionBuilder | make_timestamp | SELECT make_timestamp(2014, 12, 28, 6, 30, 45.887) | struct |
| org.apache.spark.sql.catalyst.expressions.MakeTimestampLTZExpressionBuilder | make_timestamp_ltz | SELECT make_timestamp_ltz(2014, 12, 28, 6, 30, 45.887) | struct |
| org.apache.spark.sql.catalyst.expressions.MakeTimestampNTZExpressionBuilder | make_timestamp_ntz | SELECT make_timestamp_ntz(2014, 12, 28, 6, 30, 45.887) | struct |
| org.apache.spark.sql.catalyst.expressions.MakeValidUTF8 | make_valid_utf8 | SELECT make_valid_utf8('Spark') | struct |
@@ -340,6 +342,8 @@
| org.apache.spark.sql.catalyst.expressions.Subtract | - | SELECT 2 - 1 | struct<(2 - 1):int> |
| org.apache.spark.sql.catalyst.expressions.Tan | tan | SELECT tan(0) | struct |
| org.apache.spark.sql.catalyst.expressions.Tanh | tanh | SELECT tanh(0) | struct |
+| org.apache.spark.sql.catalyst.expressions.TimeDiff | time_diff | SELECT time_diff('HOUR', TIME'20:30:29', TIME'21:30:28') | struct |
+| org.apache.spark.sql.catalyst.expressions.TimeTrunc | time_trunc | SELECT time_trunc('HOUR', TIME'09:32:05.359') | struct |
| org.apache.spark.sql.catalyst.expressions.TimeWindow | window | SELECT a, window.start, window.end, count(*) as cnt FROM VALUES ('A1', '2021-01-01 00:00:00'), ('A1', '2021-01-01 00:04:30'), ('A1', '2021-01-01 00:06:00'), ('A2', '2021-01-01 00:01:00') AS tab(a, b) GROUP by a, window(b, '5 minutes') ORDER BY a, start | struct |
| org.apache.spark.sql.catalyst.expressions.ToBinary | to_binary | SELECT to_binary('abc', 'utf-8') | struct |
| org.apache.spark.sql.catalyst.expressions.ToCharacterBuilder | to_char | SELECT to_char(454, '999') | struct |
@@ -368,6 +372,7 @@
| org.apache.spark.sql.catalyst.expressions.TryReflect | try_reflect | SELECT try_reflect('java.util.UUID', 'randomUUID') | struct |
| org.apache.spark.sql.catalyst.expressions.TrySubtract | try_subtract | SELECT try_subtract(2, 1) | struct |
| org.apache.spark.sql.catalyst.expressions.TryToBinary | try_to_binary | SELECT try_to_binary('abc', 'utf-8') | struct |
+| org.apache.spark.sql.catalyst.expressions.TryToDateExpressionBuilder | try_to_date | SELECT try_to_date('2016-12-31') | struct |
| org.apache.spark.sql.catalyst.expressions.TryToNumber | try_to_number | SELECT try_to_number('454', '999') | struct |
| org.apache.spark.sql.catalyst.expressions.TryToTimeExpressionBuilder | try_to_time | SELECT try_to_time('00:12:00.001') | struct |
| org.apache.spark.sql.catalyst.expressions.TryToTimestampExpressionBuilder | try_to_timestamp | SELECT try_to_timestamp('2016-12-31 00:12:00') | struct |
@@ -400,6 +405,8 @@
| org.apache.spark.sql.catalyst.expressions.ZeroIfNull | zeroifnull | SELECT zeroifnull(NULL) | struct |
| org.apache.spark.sql.catalyst.expressions.ZipWith | zip_with | SELECT zip_with(array(1, 2, 3), array('a', 'b', 'c'), (x, y) -> (y, x)) | struct>> |
| org.apache.spark.sql.catalyst.expressions.aggregate.AnyValue | any_value | SELECT any_value(col) FROM VALUES (10), (5), (20) AS tab(col) | struct |
+| org.apache.spark.sql.catalyst.expressions.aggregate.ApproxTopK | approx_top_k | SELECT approx_top_k(expr) FROM VALUES (0), (0), (1), (1), (2), (3), (4), (4) AS tab(expr) | struct>> |
+| org.apache.spark.sql.catalyst.expressions.aggregate.ApproxTopKAccumulate | approx_top_k_accumulate | SELECT approx_top_k_estimate(approx_top_k_accumulate(expr)) FROM VALUES (0), (0), (1), (1), (2), (3), (4), (4) AS tab(expr) | struct>> |
| org.apache.spark.sql.catalyst.expressions.aggregate.ApproximatePercentile | approx_percentile | SELECT approx_percentile(col, array(0.5, 0.4, 0.1), 100) FROM VALUES (0), (1), (2), (10) AS tab(col) | struct> |
| org.apache.spark.sql.catalyst.expressions.aggregate.ApproximatePercentile | percentile_approx | SELECT percentile_approx(col, array(0.5, 0.4, 0.1), 100) FROM VALUES (0), (1), (2), (10) AS tab(col) | struct> |
| org.apache.spark.sql.catalyst.expressions.aggregate.Average | avg | SELECT avg(col) FROM VALUES (1), (2), (3) AS tab(col) | struct |
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/binary.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/binary.sql.out
index fe61e684a7ff5..b2781c56ca7da 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/binary.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/binary.sql.out
@@ -32,3 +32,28 @@ SELECT to_csv(named_struct('n', 1, 'info', X'4561736F6E2059616F20323031382D31312
-- !query analysis
Project [to_csv(named_struct(n, 1, info, 0x4561736F6E2059616F20323031382D31312D31373A31333A33333A3333), Some(America/Los_Angeles)) AS to_csv(named_struct(n, 1, info, X'4561736F6E2059616F20323031382D31312D31373A31333A33333A3333'))#x]
+- OneRowRelation
+
+
+-- !query
+select to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop')))
+-- !query analysis
+Project [to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)) AS to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name STRING, birth INT, org STRING')
+-- !query analysis
+Project [from_xml(StructField(name,StringType,true), StructField(birth,IntegerType,true), StructField(org,StringType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name binary, birth INT, org binary')
+-- !query analysis
+Project [from_xml(StructField(name,BinaryType,true), StructField(birth,IntegerType,true), StructField(org,BinaryType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_base64.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_base64.sql.out
index fe61e684a7ff5..b2781c56ca7da 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_base64.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_base64.sql.out
@@ -32,3 +32,28 @@ SELECT to_csv(named_struct('n', 1, 'info', X'4561736F6E2059616F20323031382D31312
-- !query analysis
Project [to_csv(named_struct(n, 1, info, 0x4561736F6E2059616F20323031382D31312D31373A31333A33333A3333), Some(America/Los_Angeles)) AS to_csv(named_struct(n, 1, info, X'4561736F6E2059616F20323031382D31312D31373A31333A33333A3333'))#x]
+- OneRowRelation
+
+
+-- !query
+select to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop')))
+-- !query analysis
+Project [to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)) AS to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name STRING, birth INT, org STRING')
+-- !query analysis
+Project [from_xml(StructField(name,StringType,true), StructField(birth,IntegerType,true), StructField(org,StringType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name binary, birth INT, org binary')
+-- !query analysis
+Project [from_xml(StructField(name,BinaryType,true), StructField(birth,IntegerType,true), StructField(org,BinaryType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_basic.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_basic.sql.out
index fe61e684a7ff5..b2781c56ca7da 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_basic.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_basic.sql.out
@@ -32,3 +32,28 @@ SELECT to_csv(named_struct('n', 1, 'info', X'4561736F6E2059616F20323031382D31312
-- !query analysis
Project [to_csv(named_struct(n, 1, info, 0x4561736F6E2059616F20323031382D31312D31373A31333A33333A3333), Some(America/Los_Angeles)) AS to_csv(named_struct(n, 1, info, X'4561736F6E2059616F20323031382D31312D31373A31333A33333A3333'))#x]
+- OneRowRelation
+
+
+-- !query
+select to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop')))
+-- !query analysis
+Project [to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)) AS to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name STRING, birth INT, org STRING')
+-- !query analysis
+Project [from_xml(StructField(name,StringType,true), StructField(birth,IntegerType,true), StructField(org,StringType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name binary, birth INT, org binary')
+-- !query analysis
+Project [from_xml(StructField(name,BinaryType,true), StructField(birth,IntegerType,true), StructField(org,BinaryType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex.sql.out
index fe61e684a7ff5..b2781c56ca7da 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex.sql.out
@@ -32,3 +32,28 @@ SELECT to_csv(named_struct('n', 1, 'info', X'4561736F6E2059616F20323031382D31312
-- !query analysis
Project [to_csv(named_struct(n, 1, info, 0x4561736F6E2059616F20323031382D31312D31373A31333A33333A3333), Some(America/Los_Angeles)) AS to_csv(named_struct(n, 1, info, X'4561736F6E2059616F20323031382D31312D31373A31333A33333A3333'))#x]
+- OneRowRelation
+
+
+-- !query
+select to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop')))
+-- !query analysis
+Project [to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)) AS to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name STRING, birth INT, org STRING')
+-- !query analysis
+Project [from_xml(StructField(name,StringType,true), StructField(birth,IntegerType,true), StructField(org,StringType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name binary, birth INT, org binary')
+-- !query analysis
+Project [from_xml(StructField(name,BinaryType,true), StructField(birth,IntegerType,true), StructField(org,BinaryType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex_discrete.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex_discrete.sql.out
index fe61e684a7ff5..b2781c56ca7da 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex_discrete.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/binary_hex_discrete.sql.out
@@ -32,3 +32,28 @@ SELECT to_csv(named_struct('n', 1, 'info', X'4561736F6E2059616F20323031382D31312
-- !query analysis
Project [to_csv(named_struct(n, 1, info, 0x4561736F6E2059616F20323031382D31312D31373A31333A33333A3333), Some(America/Los_Angeles)) AS to_csv(named_struct(n, 1, info, X'4561736F6E2059616F20323031382D31312D31373A31333A33333A3333'))#x]
+- OneRowRelation
+
+
+-- !query
+select to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop')))
+-- !query analysis
+Project [to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)) AS to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name STRING, birth INT, org STRING')
+-- !query analysis
+Project [from_xml(StructField(name,StringType,true), StructField(birth,IntegerType,true), StructField(org,StringType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT from_xml(
+ to_xml(named_struct('name', binary('Eason'), 'birth', 2018, 'org', binary('Kindergarten Cop'))),
+ 'name binary, birth INT, org binary')
+-- !query analysis
+Project [from_xml(StructField(name,BinaryType,true), StructField(birth,IntegerType,true), StructField(org,BinaryType,true), to_xml(named_struct(name, cast(Eason as binary), birth, 2018, org, cast(Kindergarten Cop as binary)), Some(America/Los_Angeles)), Some(America/Los_Angeles)) AS from_xml(to_xml(named_struct(name, Eason, birth, 2018, org, Kindergarten Cop)))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/cast.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/cast.sql.out
index 643dfd3771ffe..053d7af3df45f 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/cast.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/cast.sql.out
@@ -881,6 +881,97 @@ Project [cast(10.654321 as interval month) AS CAST(10.654321 AS INTERVAL MONTH)#
+- OneRowRelation
+-- !query
+SELECT CAST(TIME '00:01:52' AS tinyint)
+-- !query analysis
+Project [cast(00:01:52 as tinyint) AS CAST(TIME '00:01:52' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:01:52' AS smallint)
+-- !query analysis
+Project [cast(00:01:52 as smallint) AS CAST(TIME '00:01:52' AS SMALLINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:01:52' AS int)
+-- !query analysis
+Project [cast(00:01:52 as int) AS CAST(TIME '00:01:52' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:01:52' AS bigint)
+-- !query analysis
+Project [cast(00:01:52 as bigint) AS CAST(TIME '00:01:52' AS BIGINT)#xL]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS tinyint)
+-- !query analysis
+Project [cast(23:59:59 as tinyint) AS CAST(TIME '23:59:59' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS smallint)
+-- !query analysis
+Project [cast(23:59:59 as smallint) AS CAST(TIME '23:59:59' AS SMALLINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS int)
+-- !query analysis
+Project [cast(23:59:59 as int) AS CAST(TIME '23:59:59' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS bigint)
+-- !query analysis
+Project [cast(23:59:59 as bigint) AS CAST(TIME '23:59:59' AS BIGINT)#xL]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:17.5' AS tinyint)
+-- !query analysis
+Project [cast(00:00:17.5 as tinyint) AS CAST(TIME '00:00:17.5' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:17.5' AS int)
+-- !query analysis
+Project [cast(00:00:17.5 as int) AS CAST(TIME '00:00:17.5' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:17.9' AS int)
+-- !query analysis
+Project [cast(00:00:17.9 as int) AS CAST(TIME '00:00:17.9' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:00' AS tinyint)
+-- !query analysis
+Project [cast(00:00:00 as tinyint) AS CAST(TIME '00:00:00' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:00' AS int)
+-- !query analysis
+Project [cast(00:00:00 as int) AS CAST(TIME '00:00:00' AS INT)#x]
++- OneRowRelation
+
+
-- !query
SELECT '1.23' :: int
-- !query analysis
@@ -1033,6 +1124,34 @@ Project [cast(10.123456 as interval day to second) AS CAST(10.123456 AS INTERVAL
+- OneRowRelation
+-- !query
+SELECT TIME '00:01:52' :: tinyint
+-- !query analysis
+Project [cast(00:01:52 as tinyint) AS CAST(TIME '00:01:52' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT TIME '00:01:52' :: int
+-- !query analysis
+Project [cast(00:01:52 as int) AS CAST(TIME '00:01:52' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT TIME '23:59:59' :: tinyint
+-- !query analysis
+Project [cast(23:59:59 as tinyint) AS CAST(TIME '23:59:59' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT TIME '23:59:59' :: int
+-- !query analysis
+Project [cast(23:59:59 as int) AS CAST(TIME '23:59:59' AS INT)#x]
++- OneRowRelation
+
+
-- !query
SELECT '1.23' :: int :: long
-- !query analysis
@@ -1113,3 +1232,122 @@ org.apache.spark.sql.catalyst.parser.ParseException
"hint" : ""
}
}
+
+
+-- !query
+SELECT CAST(time '00:00:00' AS decimal(1, 0))
+-- !query analysis
+Project [cast(00:00:00 as decimal(1,0)) AS CAST(TIME '00:00:00' AS DECIMAL(1,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '12:00:00' AS decimal(7, 2))
+-- !query analysis
+Project [cast(12:00:00 as decimal(7,2)) AS CAST(TIME '12:00:00' AS DECIMAL(7,2))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '01:30:45' AS decimal(8, 3))
+-- !query analysis
+Project [cast(01:30:45 as decimal(8,3)) AS CAST(TIME '01:30:45' AS DECIMAL(8,3))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59' AS decimal(9, 4))
+-- !query analysis
+Project [cast(23:59:59 as decimal(9,4)) AS CAST(TIME '23:59:59' AS DECIMAL(9,4))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '01:02:03' AS decimal(15, 9))
+-- !query analysis
+Project [cast(01:02:03 as decimal(15,9)) AS CAST(TIME '01:02:03' AS DECIMAL(15,9))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '10:20:30' AS decimal(20, 10))
+-- !query analysis
+Project [cast(10:20:30 as decimal(20,10)) AS CAST(TIME '10:20:30' AS DECIMAL(20,10))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.001' AS decimal(8, 3))
+-- !query analysis
+Project [cast(23:59:59.001 as decimal(8,3)) AS CAST(TIME '23:59:59.001' AS DECIMAL(8,3))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999' AS decimal(11, 6))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(11,6)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(11,6))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999999' AS decimal(14, 9))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(14,9)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(14,9))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999999' AS decimal(20, 10))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(20,10)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(20,10))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '00:01:00' AS decimal(1, 0))
+-- !query analysis
+Project [cast(00:01:00 as decimal(1,0)) AS CAST(TIME '00:01:00' AS DECIMAL(1,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '01:00:00' AS decimal(3, 0))
+-- !query analysis
+Project [cast(01:00:00 as decimal(3,0)) AS CAST(TIME '01:00:00' AS DECIMAL(3,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '10:00:00' AS decimal(5, 2))
+-- !query analysis
+Project [cast(10:00:00 as decimal(5,2)) AS CAST(TIME '10:00:00' AS DECIMAL(5,2))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.9' AS decimal(6, 0))
+-- !query analysis
+Project [cast(23:59:59.9 as decimal(6,0)) AS CAST(TIME '23:59:59.9' AS DECIMAL(6,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999' AS decimal(8, 2))
+-- !query analysis
+Project [cast(23:59:59.999 as decimal(8,2)) AS CAST(TIME '23:59:59.999' AS DECIMAL(8,2))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999' AS decimal(11, 5))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(11,5)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(11,5))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999999' AS decimal(14, 8))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(14,8)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(14,8))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/charvarchar.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/charvarchar.sql.out
index 524797015a2f6..4e864523368d7 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/charvarchar.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/charvarchar.sql.out
@@ -376,7 +376,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`char_tbl4`, false
insert into char_tbl4 select c, c, v, c from str_view
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/char_tbl4, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/char_tbl4], Append, `spark_catalog`.`default`.`char_tbl4`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/char_tbl4), [c7, c8, v, s]
-+- Project [static_invoke(CharVarcharCodegenUtils.charTypeWriteSideCheck(cast(c#x as string), 7)) AS c7#x, static_invoke(CharVarcharCodegenUtils.charTypeWriteSideCheck(cast(c#x as string), 8)) AS c8#x, static_invoke(CharVarcharCodegenUtils.varcharTypeWriteSideCheck(cast(v#x as string), 6)) AS v#x, cast(c#x as string) AS s#x]
++- Project [static_invoke(CharVarcharCodegenUtils.charTypeWriteSideCheck(cast(c#x as string), 7)) AS c7#x, static_invoke(CharVarcharCodegenUtils.charTypeWriteSideCheck(cast(c#x as string), 8)) AS c8#x, static_invoke(CharVarcharCodegenUtils.varcharTypeWriteSideCheck(cast(v#x as string), 6)) AS v#x, c#x AS s#x]
+- Project [c#x, c#x, v#x, c#x]
+- SubqueryAlias str_view
+- View (`str_view`, [c#x, v#x])
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/collations-aliases.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-aliases.sql.out
new file mode 100644
index 0000000000000..454682e392be8
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-aliases.sql.out
@@ -0,0 +1,335 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+create table t1(s string, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
+
+
+-- !query
+insert into t1 values ('Spark', 'Spark', 'SQL')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaAAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaAaaAaaAaAaaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('bbAbaAbA', 'bbAbAAbA', 'a')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo ')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo ', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'i̇o')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('efd2', 'efd2', 'efd2')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Hello, world! Nice day.', 'Hello, world! Nice day.', 'Hello, world! Nice day.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Something else. Nothing here.', 'Something else. Nothing here.', 'Something else. Nothing here.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('kitten', 'kitten', 'sitTing')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abc', 'abc', 'abc')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abcdcba', 'abcdcba', 'aBcDCbA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+-- !query analysis
+Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select `concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)` from (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+)
+-- !query analysis
+Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias __auto_generated_subquery_name
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select * from (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+)
+-- !query analysis
+Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias __auto_generated_subquery_name
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select subq1.* from (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+) AS subq1
+-- !query analysis
+Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias subq1
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+with cte as (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+)
+select * from cte
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias cte
+: +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+: +- SubqueryAlias spark_catalog.default.t1
+: +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
++- Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias cte
+ +- CTERelationRef xxxx, true, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x], false, false
+
+
+-- !query
+select * from values (1) where exists (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+)
+-- !query analysis
+Project [col1#x]
++- Filter exists#x []
+ : +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ : +- SubqueryAlias spark_catalog.default.t1
+ : +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1 limit 1
+)
+-- !query analysis
+Project [scalar-subquery#x [] AS scalarsubquery()#x]
+: +- GlobalLimit 1
+: +- LocalLimit 1
+: +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+: +- SubqueryAlias spark_catalog.default.t1
+: +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
++- OneRowRelation
+
+
+-- !query
+select (
+ with cte as (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+ )
+ select * from cte limit 1
+)
+-- !query analysis
+Project [scalar-subquery#x [] AS scalarsubquery()#x]
+: +- WithCTE
+: :- CTERelationDef xxxx, false
+: : +- SubqueryAlias cte
+: : +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+: : +- SubqueryAlias spark_catalog.default.t1
+: : +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+: +- GlobalLimit 1
+: +- LocalLimit 1
+: +- Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+: +- SubqueryAlias cte
+: +- CTERelationRef xxxx, true, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x], false, false
++- OneRowRelation
+
+
+-- !query
+select * from (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1 limit 1
+)
+where (
+ `concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)` == 'aaa'
+)
+-- !query analysis
+Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- Filter (concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x = aaa)
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- GlobalLimit 1
+ +- LocalLimit 1
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lower(`concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)`) from (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+ group by 1
+ order by 1
+)
+-- !query analysis
+Project [lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x) AS lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias __auto_generated_subquery_name
+ +- Sort [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x ASC NULLS FIRST], true
+ +- Aggregate [concat_ws( , utf8_lcase#x, utf8_lcase#x)], [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lower(`concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)`) from (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+ group by 1
+ order by max(concat_ws(' ', utf8_lcase, utf8_lcase))
+)
+-- !query analysis
+Project [lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x) AS lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias __auto_generated_subquery_name
+ +- Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- Sort [max(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x ASC NULLS FIRST], true
+ +- Aggregate [concat_ws( , utf8_lcase#x, utf8_lcase#x)], [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x, max(concat_ws( , utf8_lcase#x, utf8_lcase#x)) AS max(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+create temporary view v1 as (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+)
+-- !query analysis
+CreateViewCommand `v1`, (
+ select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+), false, false, LocalTempView, UNSUPPORTED, true
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select * from v1
+-- !query analysis
+Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias v1
+ +- View (`v1`, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x])
+ +- Project [cast(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x as string collate UTF8_LCASE) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select `concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)` from v1
+-- !query analysis
+Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias v1
+ +- View (`v1`, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x])
+ +- Project [cast(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x as string collate UTF8_LCASE) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+drop view v1
+-- !query analysis
+DropTempViewCommand v1
+
+
+-- !query
+drop table t1
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/collations-basic.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-basic.sql.out
new file mode 100644
index 0000000000000..03409b001c153
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-basic.sql.out
@@ -0,0 +1,1164 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+create table t1(utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
+
+
+-- !query
+insert into t1 values('aaa', 'aaa')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+insert into t1 values('AAA', 'AAA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+insert into t1 values('bbb', 'bbb')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+insert into t1 values('BBB', 'BBB')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+describe table t1
+-- !query analysis
+DescribeTableCommand `spark_catalog`.`default`.`t1`, false, [col_name#x, data_type#x, comment#x]
+
+
+-- !query
+select count(*) from t1 group by utf8_binary
+-- !query analysis
+Aggregate [utf8_binary#x], [count(1) AS count(1)#xL]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select count(*) from t1 group by utf8_lcase
+-- !query analysis
+Aggregate [utf8_lcase#x], [count(1) AS count(1)#xL]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select * from t1 where utf8_binary = 'aaa'
+-- !query analysis
+Project [utf8_binary#x, utf8_lcase#x]
++- Filter (utf8_binary#x = aaa)
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select * from t1 where utf8_lcase = 'aaa' collate utf8_lcase
+-- !query analysis
+Project [utf8_binary#x, utf8_lcase#x]
++- Filter (utf8_lcase#x = collate(aaa, utf8_lcase))
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select * from t1 where utf8_binary < 'bbb'
+-- !query analysis
+Project [utf8_binary#x, utf8_lcase#x]
++- Filter (utf8_binary#x < bbb)
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select * from t1 where utf8_lcase < 'bbb' collate utf8_lcase
+-- !query analysis
+Project [utf8_binary#x, utf8_lcase#x]
++- Filter (utf8_lcase#x < collate(bbb, utf8_lcase))
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select l.utf8_binary, r.utf8_lcase from t1 l join t1 r on l.utf8_lcase = r.utf8_lcase
+-- !query analysis
+Project [utf8_binary#x, utf8_lcase#x]
++- Join Inner, (utf8_lcase#x = utf8_lcase#x)
+ :- SubqueryAlias l
+ : +- SubqueryAlias spark_catalog.default.t1
+ : +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+ +- SubqueryAlias r
+ +- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+create table t2(utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t2`, false
+
+
+-- !query
+insert into t2 values('aaa', 'aaa')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+insert into t2 values('bbb', 'bbb')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+select * from t1 anti join t2 on t1.utf8_lcase = t2.utf8_lcase
+-- !query analysis
+Project [utf8_binary#x, utf8_lcase#x]
++- Join LeftAnti, (utf8_lcase#x = utf8_lcase#x)
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
+ +- SubqueryAlias spark_catalog.default.t2
+ +- Relation spark_catalog.default.t2[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+drop table t2
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t2
+
+
+-- !query
+drop table t1
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except select col1 collate utf8_lcase from values ('aaa'), ('bbb')
+-- !query analysis
+Except false
+:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+: +- LocalRelation [col1#x]
++- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except all select col1 collate utf8_lcase from values ('aaa'), ('bbb')
+-- !query analysis
+Except All true
+:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+: +- LocalRelation [col1#x]
++- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union select col1 collate utf8_lcase from values ('aaa'), ('bbb')
+-- !query analysis
+Distinct
++- Union false, false
+ :- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+ : +- LocalRelation [col1#x]
+ +- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union all select col1 collate utf8_lcase from values ('aaa'), ('bbb')
+-- !query analysis
+Union false, false
+:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+: +- LocalRelation [col1#x]
++- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') intersect select col1 collate utf8_lcase from values ('aaa'), ('bbb')
+-- !query analysis
+Intersect false
+:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+: +- LocalRelation [col1#x]
++- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except select col1 collate unicode_ci from values ('aaa'), ('bbb')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
+ "sqlState" : "42825",
+ "messageParameters" : {
+ "columnOrdinalNumber" : "first",
+ "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
+ "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
+ "hint" : "",
+ "operator" : "EXCEPT",
+ "tableOrdinalNumber" : "second"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 1,
+ "stopIndex" : 162,
+ "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except select col1 collate unicode_ci from values ('aaa'), ('bbb')"
+ } ]
+}
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except all select col1 collate unicode_ci from values ('aaa'), ('bbb')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
+ "sqlState" : "42825",
+ "messageParameters" : {
+ "columnOrdinalNumber" : "first",
+ "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
+ "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
+ "hint" : "",
+ "operator" : "EXCEPT ALL",
+ "tableOrdinalNumber" : "second"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 1,
+ "stopIndex" : 166,
+ "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except all select col1 collate unicode_ci from values ('aaa'), ('bbb')"
+ } ]
+}
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union select col1 collate unicode_ci from values ('aaa'), ('bbb')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
+ "sqlState" : "42825",
+ "messageParameters" : {
+ "columnOrdinalNumber" : "first",
+ "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
+ "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
+ "hint" : "",
+ "operator" : "UNION",
+ "tableOrdinalNumber" : "second"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 1,
+ "stopIndex" : 161,
+ "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union select col1 collate unicode_ci from values ('aaa'), ('bbb')"
+ } ]
+}
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union all select col1 collate unicode_ci from values ('aaa'), ('bbb')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
+ "sqlState" : "42825",
+ "messageParameters" : {
+ "columnOrdinalNumber" : "first",
+ "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
+ "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
+ "hint" : "",
+ "operator" : "UNION",
+ "tableOrdinalNumber" : "second"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 1,
+ "stopIndex" : 165,
+ "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union all select col1 collate unicode_ci from values ('aaa'), ('bbb')"
+ } ]
+}
+
+
+-- !query
+select col1 collate utf8_lcase from values ('aaa'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') intersect select col1 collate unicode_ci from values ('aaa'), ('bbb')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
+ "sqlState" : "42825",
+ "messageParameters" : {
+ "columnOrdinalNumber" : "first",
+ "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
+ "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
+ "hint" : "",
+ "operator" : "INTERSECT",
+ "tableOrdinalNumber" : "second"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 1,
+ "stopIndex" : 156,
+ "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') intersect select col1 collate unicode_ci from values ('aaa'), ('bbb')"
+ } ]
+}
+
+
+-- !query
+create table t1 (c1 struct<utf8_binary: string collate utf8_binary, utf8_lcase: string collate utf8_lcase>) USING PARQUET
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
+
+
+-- !query
+insert into t1 values (named_struct('utf8_binary', 'aaa', 'utf8_lcase', 'aaa'))
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [c1]
++- Project [named_struct(utf8_binary, col1#x.utf8_binary, utf8_lcase, cast(col1#x.utf8_lcase as string collate UTF8_LCASE)) AS c1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+insert into t1 values (named_struct('utf8_binary', 'AAA', 'utf8_lcase', 'AAA'))
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [c1]
++- Project [named_struct(utf8_binary, col1#x.utf8_binary, utf8_lcase, cast(col1#x.utf8_lcase as string collate UTF8_LCASE)) AS c1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select count(*) from t1 group by c1.utf8_binary
+-- !query analysis
+Aggregate [c1#x.utf8_binary], [count(1) AS count(1)#xL]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[c1#x] parquet
+
+
+-- !query
+select count(*) from t1 group by c1.utf8_lcase
+-- !query analysis
+Aggregate [c1#x.utf8_lcase], [count(1) AS count(1)#xL]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[c1#x] parquet
+
+
+-- !query
+drop table t1
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
+
+
+-- !query
+select array_contains(ARRAY('aaa' collate utf8_lcase),'AAA' collate utf8_lcase)
+-- !query analysis
+Project [array_contains(array(collate(aaa, utf8_lcase)), collate(AAA, utf8_lcase)) AS array_contains(array(collate(aaa, utf8_lcase)), collate(AAA, utf8_lcase))#x]
++- OneRowRelation
+
+
+-- !query
+select array_position(ARRAY('aaa' collate utf8_lcase, 'bbb' collate utf8_lcase),'BBB' collate utf8_lcase)
+-- !query analysis
+Project [array_position(array(collate(aaa, utf8_lcase), collate(bbb, utf8_lcase)), collate(BBB, utf8_lcase)) AS array_position(array(collate(aaa, utf8_lcase), collate(bbb, utf8_lcase)), collate(BBB, utf8_lcase))#xL]
++- OneRowRelation
+
+
+-- !query
+select nullif('aaa' COLLATE utf8_lcase, 'AAA' COLLATE utf8_lcase)
+-- !query analysis
+Project [nullif(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase)) AS nullif(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase))#x]
++- OneRowRelation
+
+
+-- !query
+select least('aaa' COLLATE utf8_lcase, 'AAA' collate utf8_lcase, 'a' collate utf8_lcase)
+-- !query analysis
+Project [least(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase), collate(a, utf8_lcase)) AS least(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase), collate(a, utf8_lcase))#x]
++- OneRowRelation
+
+
+-- !query
+select arrays_overlap(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
+-- !query analysis
+Project [arrays_overlap(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS arrays_overlap(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
++- OneRowRelation
+
+
+-- !query
+select array_distinct(array('aaa' collate utf8_lcase, 'AAA' collate utf8_lcase))
+-- !query analysis
+Project [array_distinct(array(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase))) AS array_distinct(array(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase)))#x]
++- OneRowRelation
+
+
+-- !query
+select array_union(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
+-- !query analysis
+Project [array_union(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS array_union(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
++- OneRowRelation
+
+
+-- !query
+select array_intersect(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
+-- !query analysis
+Project [array_intersect(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS array_intersect(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
++- OneRowRelation
+
+
+-- !query
+select array_except(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
+-- !query analysis
+Project [array_except(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS array_except(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate unicode < 'A'
+-- !query analysis
+Project [(collate(a, unicode) < A) AS (collate(a, unicode) < 'A' collate UNICODE)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate unicode_ci = 'A'
+-- !query analysis
+Project [(collate(a, unicode_ci) = A) AS (collate(a, unicode_ci) = 'A' collate UNICODE_CI)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate unicode_ai = 'å'
+-- !query analysis
+Project [(collate(a, unicode_ai) = å) AS (collate(a, unicode_ai) = 'å' collate UNICODE_AI)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate unicode_ci_ai = 'Å'
+-- !query analysis
+Project [(collate(a, unicode_ci_ai) = Å) AS (collate(a, unicode_ci_ai) = 'Å' collate UNICODE_CI_AI)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate en < 'A'
+-- !query analysis
+Project [(collate(a, en) < A) AS (collate(a, en) < 'A' collate en)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate en_ci = 'A'
+-- !query analysis
+Project [(collate(a, en_ci) = A) AS (collate(a, en_ci) = 'A' collate en_CI)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate en_ai = 'å'
+-- !query analysis
+Project [(collate(a, en_ai) = å) AS (collate(a, en_ai) = 'å' collate en_AI)#x]
++- OneRowRelation
+
+
+-- !query
+select 'a' collate en_ci_ai = 'Å'
+-- !query analysis
+Project [(collate(a, en_ci_ai) = Å) AS (collate(a, en_ci_ai) = 'Å' collate en_CI_AI)#x]
++- OneRowRelation
+
+
+-- !query
+select 'Kypper' collate sv < 'Köpfe'
+-- !query analysis
+Project [(collate(Kypper, sv) < Köpfe) AS (collate(Kypper, sv) < 'Köpfe' collate sv)#x]
++- OneRowRelation
+
+
+-- !query
+select 'Kypper' collate de > 'Köpfe'
+-- !query analysis
+Project [(collate(Kypper, de) > Köpfe) AS (collate(Kypper, de) > 'Köpfe' collate de)#x]
++- OneRowRelation
+
+
+-- !query
+select 'I' collate tr_ci = 'ı'
+-- !query analysis
+Project [(collate(I, tr_ci) = ı) AS (collate(I, tr_ci) = 'ı' collate tr_CI)#x]
++- OneRowRelation
+
+
+-- !query
+create table t3 (text string collate utf8_binary, pairDelim string collate utf8_lcase, keyValueDelim string collate utf8_binary) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t3`, false
+
+
+-- !query
+insert into t3 values('a:1,b:2,c:3', ',', ':')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [text, pairDelim, keyValueDelim]
++- Project [col1#x AS text#x, cast(col2#x as string collate UTF8_LCASE) AS pairDelim#x, col3#x AS keyValueDelim#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+select str_to_map(text, pairDelim, keyValueDelim) from t3
+-- !query analysis
+Project [str_to_map(cast(text#x as string collate null), cast(pairDelim#x as string collate null), cast(keyValueDelim#x as string collate null)) AS str_to_map(text, pairDelim, keyValueDelim)#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[text#x,pairDelim#x,keyValueDelim#x] parquet
+
+
+-- !query
+select str_to_map(text collate utf8_binary, pairDelim collate utf8_lcase, keyValueDelim collate utf8_binary) from t3
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select str_to_map(text collate utf8_binary, pairDelim collate utf8_binary, keyValueDelim collate utf8_binary) from t3
+-- !query analysis
+Project [str_to_map(collate(text#x, utf8_binary), collate(pairDelim#x, utf8_binary), collate(keyValueDelim#x, utf8_binary)) AS str_to_map(collate(text, utf8_binary), collate(pairDelim, utf8_binary), collate(keyValueDelim, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[text#x,pairDelim#x,keyValueDelim#x] parquet
+
+
+-- !query
+select str_to_map(text collate unicode_ai, pairDelim collate unicode_ai, keyValueDelim collate unicode_ai) from t3
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(text, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"str_to_map(collate(text, unicode_ai), collate(pairDelim, unicode_ai), collate(keyValueDelim, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 106,
+ "fragment" : "str_to_map(text collate unicode_ai, pairDelim collate unicode_ai, keyValueDelim collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+drop table t3
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t3
+
+
+-- !query
+create table t1(s string, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
+
+
+-- !query
+insert into t1 values ('Spark', 'Spark', 'SQL')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaAAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaAaaAaaAaAaaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('bbAbaAbA', 'bbAbAAbA', 'a')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo ')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo ', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'i̇o')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('efd2', 'efd2', 'efd2')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Hello, world! Nice day.', 'Hello, world! Nice day.', 'Hello, world! Nice day.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Something else. Nothing here.', 'Something else. Nothing here.', 'Something else. Nothing here.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('kitten', 'kitten', 'sitTing')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abc', 'abc', 'abc')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abcdcba', 'abcdcba', 'aBcDCbA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+create table t2(ascii double) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t2`, false
+
+
+-- !query
+insert into t2 values (97.52143)
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [ascii]
++- Project [cast(col1#x as double) AS ascii#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+insert into t2 values (66.421)
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [ascii]
++- Project [cast(col1#x as double) AS ascii#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+create table t3(utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t3`, false
+
+
+-- !query
+insert into t3 values ('aaAaAAaA', 'aaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+insert into t3 values ('efd2', 'efd2')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [utf8_binary, utf8_lcase]
++- Project [col1#x AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+create table t4(num long) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t4`, false
+
+
+-- !query
+insert into t4 values (97)
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t4, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t4], Append, `spark_catalog`.`default`.`t4`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t4), [num]
++- Project [cast(col1#x as bigint) AS num#xL]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+insert into t4 values (66)
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t4, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t4], Append, `spark_catalog`.`default`.`t4`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t4), [num]
++- Project [cast(col1#x as bigint) AS num#xL]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+select elt(2, s, utf8_binary) from t1
+-- !query analysis
+Project [elt(2, s#x, utf8_binary#x, true) AS elt(2, s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select elt(2, utf8_binary, utf8_lcase, s) from t1
+-- !query analysis
+Project [elt(2, cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), cast(s#x as string collate null), true) AS elt(2, utf8_binary, utf8_lcase, s)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select elt(1, utf8_binary collate utf8_binary, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select elt(1, utf8_binary collate utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [elt(1, collate(utf8_binary#x, utf8_binary), collate(utf8_lcase#x, utf8_binary), true) AS elt(1, collate(utf8_binary, utf8_binary), collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select elt(1, utf8_binary collate utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [elt(1, collate(utf8_binary#x, utf8_binary), cast(utf8_lcase#x as string), true) AS elt(1, collate(utf8_binary, utf8_binary), utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select elt(1, utf8_binary, 'word'), elt(1, utf8_lcase, 'word') from t1
+-- !query analysis
+Project [elt(1, utf8_binary#x, word, true) AS elt(1, utf8_binary, word)#x, elt(1, utf8_lcase#x, word, true) AS elt(1, utf8_lcase, 'word' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select elt(1, utf8_binary, 'word' collate utf8_lcase), elt(1, utf8_lcase, 'word' collate utf8_binary) from t1
+-- !query analysis
+Project [elt(1, cast(utf8_binary#x as string collate UTF8_LCASE), collate(word, utf8_lcase), true) AS elt(1, utf8_binary, collate(word, utf8_lcase))#x, elt(1, cast(utf8_lcase#x as string), collate(word, utf8_binary), true) AS elt(1, utf8_lcase, collate(word, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select ascii(utf8_binary), ascii(utf8_lcase) from t1
+-- !query analysis
+Project [ascii(utf8_binary#x) AS ascii(utf8_binary)#x, ascii(utf8_lcase#x) AS ascii(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select ascii(utf8_binary collate utf8_lcase), ascii(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [ascii(collate(utf8_binary#x, utf8_lcase)) AS ascii(collate(utf8_binary, utf8_lcase))#x, ascii(collate(utf8_lcase#x, utf8_binary)) AS ascii(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select unbase64(utf8_binary), unbase64(utf8_lcase) from t3
+-- !query analysis
+Project [unbase64(utf8_binary#x, false) AS unbase64(utf8_binary)#x, unbase64(utf8_lcase#x, false) AS unbase64(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select unbase64(utf8_binary collate utf8_lcase), unbase64(utf8_lcase collate utf8_binary) from t3
+-- !query analysis
+Project [unbase64(collate(utf8_binary#x, utf8_lcase), false) AS unbase64(collate(utf8_binary, utf8_lcase))#x, unbase64(collate(utf8_lcase#x, utf8_binary), false) AS unbase64(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select base64(utf8_binary), base64(utf8_lcase) from t1
+-- !query analysis
+Project [base64(cast(utf8_binary#x as binary)) AS base64(utf8_binary)#x, base64(cast(utf8_lcase#x as binary)) AS base64(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select base64(utf8_binary collate utf8_lcase), base64(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [base64(cast(collate(utf8_binary#x, utf8_lcase) as binary)) AS base64(collate(utf8_binary, utf8_lcase))#x, base64(cast(collate(utf8_lcase#x, utf8_binary) as binary)) AS base64(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select decode(encode(utf8_binary, 'utf-8'), 'utf-8'), decode(encode(utf8_lcase, 'utf-8'), 'utf-8') from t1
+-- !query analysis
+Project [decode(encode(utf8_binary#x, utf-8), utf-8) AS decode(encode(utf8_binary, utf-8), utf-8)#x, decode(encode(utf8_lcase#x, utf-8), utf-8) AS decode(encode(utf8_lcase, utf-8), utf-8)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select decode(encode(utf8_binary collate utf8_lcase, 'utf-8'), 'utf-8'), decode(encode(utf8_lcase collate utf8_binary, 'utf-8'), 'utf-8') from t1
+-- !query analysis
+Project [decode(encode(collate(utf8_binary#x, utf8_lcase), utf-8), utf-8) AS decode(encode(collate(utf8_binary, utf8_lcase), utf-8), utf-8)#x, decode(encode(collate(utf8_lcase#x, utf8_binary), utf-8), utf-8) AS decode(encode(collate(utf8_lcase, utf8_binary), utf-8), utf-8)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select format_number(ascii, '###.###') from t2
+-- !query analysis
+Project [format_number(ascii#x, ###.###) AS format_number(ascii, ###.###)#x]
++- SubqueryAlias spark_catalog.default.t2
+ +- Relation spark_catalog.default.t2[ascii#x] parquet
+
+
+-- !query
+select format_number(ascii, '###.###' collate utf8_lcase) from t2
+-- !query analysis
+Project [format_number(ascii#x, collate(###.###, utf8_lcase)) AS format_number(ascii, collate(###.###, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t2
+ +- Relation spark_catalog.default.t2[ascii#x] parquet
+
+
+-- !query
+select encode(utf8_binary, 'utf-8'), encode(utf8_lcase, 'utf-8') from t1
+-- !query analysis
+Project [encode(utf8_binary#x, utf-8) AS encode(utf8_binary, utf-8)#x, encode(utf8_lcase#x, utf-8) AS encode(utf8_lcase, utf-8)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select encode(utf8_binary collate utf8_lcase, 'utf-8'), encode(utf8_lcase collate utf8_binary, 'utf-8') from t1
+-- !query analysis
+Project [encode(collate(utf8_binary#x, utf8_lcase), utf-8) AS encode(collate(utf8_binary, utf8_lcase), utf-8)#x, encode(collate(utf8_lcase#x, utf8_binary), utf-8) AS encode(collate(utf8_lcase, utf8_binary), utf-8)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select to_binary(utf8_binary, 'utf-8'), to_binary(utf8_lcase, 'utf-8') from t1
+-- !query analysis
+Project [to_binary(utf8_binary#x, Some(utf-8), false) AS to_binary(utf8_binary, utf-8)#x, to_binary(utf8_lcase#x, Some(utf-8), false) AS to_binary(utf8_lcase, utf-8)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select to_binary(utf8_binary collate utf8_lcase, 'utf-8'), to_binary(utf8_lcase collate utf8_binary, 'utf-8') from t1
+-- !query analysis
+Project [to_binary(collate(utf8_binary#x, utf8_lcase), Some(utf-8), false) AS to_binary(collate(utf8_binary, utf8_lcase), utf-8)#x, to_binary(collate(utf8_lcase#x, utf8_binary), Some(utf-8), false) AS to_binary(collate(utf8_lcase, utf8_binary), utf-8)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select soundex(utf8_binary), soundex(utf8_lcase) from t1
+-- !query analysis
+Project [soundex(utf8_binary#x) AS soundex(utf8_binary)#x, soundex(utf8_lcase#x) AS soundex(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select soundex(utf8_binary collate utf8_lcase), soundex(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [soundex(collate(utf8_binary#x, utf8_lcase)) AS soundex(collate(utf8_binary, utf8_lcase))#x, soundex(collate(utf8_lcase#x, utf8_binary)) AS soundex(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select luhn_check(num) from t4
+-- !query analysis
+Project [luhn_check(cast(num#xL as string)) AS luhn_check(num)#x]
++- SubqueryAlias spark_catalog.default.t4
+ +- Relation spark_catalog.default.t4[num#xL] parquet
+
+
+-- !query
+select levenshtein(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [levenshtein(cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), None) AS levenshtein(utf8_binary, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select levenshtein(s, utf8_binary) from t1
+-- !query analysis
+Project [levenshtein(s#x, utf8_binary#x, None) AS levenshtein(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select levenshtein(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select levenshtein(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [levenshtein(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), None) AS levenshtein(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select levenshtein(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [levenshtein(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), None) AS levenshtein(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select levenshtein(utf8_binary, 'a'), levenshtein(utf8_lcase, 'a') from t1
+-- !query analysis
+Project [levenshtein(utf8_binary#x, a, None) AS levenshtein(utf8_binary, a)#x, levenshtein(utf8_lcase#x, a, None) AS levenshtein(utf8_lcase, 'a' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select levenshtein(utf8_binary, 'AaAA' collate utf8_lcase, 3), levenshtein(utf8_lcase, 'AAa' collate utf8_binary, 4) from t1
+-- !query analysis
+Project [levenshtein(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), Some(3)) AS levenshtein(utf8_binary, collate(AaAA, utf8_lcase), 3)#x, levenshtein(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), Some(4)) AS levenshtein(utf8_lcase, collate(AAa, utf8_binary), 4)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select is_valid_utf8(utf8_binary), is_valid_utf8(utf8_lcase) from t1
+-- !query analysis
+Project [is_valid_utf8(utf8_binary#x) AS is_valid_utf8(utf8_binary)#x, is_valid_utf8(utf8_lcase#x) AS is_valid_utf8(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select is_valid_utf8(utf8_binary collate utf8_lcase), is_valid_utf8(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [is_valid_utf8(collate(utf8_binary#x, utf8_lcase)) AS is_valid_utf8(collate(utf8_binary, utf8_lcase))#x, is_valid_utf8(collate(utf8_lcase#x, utf8_binary)) AS is_valid_utf8(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select is_valid_utf8(utf8_binary collate utf8_lcase_rtrim), is_valid_utf8(utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [is_valid_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS is_valid_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, is_valid_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS is_valid_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select make_valid_utf8(utf8_binary), make_valid_utf8(utf8_lcase) from t1
+-- !query analysis
+Project [make_valid_utf8(utf8_binary#x) AS make_valid_utf8(utf8_binary)#x, make_valid_utf8(utf8_lcase#x) AS make_valid_utf8(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select make_valid_utf8(utf8_binary collate utf8_lcase), make_valid_utf8(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [make_valid_utf8(collate(utf8_binary#x, utf8_lcase)) AS make_valid_utf8(collate(utf8_binary, utf8_lcase))#x, make_valid_utf8(collate(utf8_lcase#x, utf8_binary)) AS make_valid_utf8(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select make_valid_utf8(utf8_binary collate utf8_lcase_rtrim), make_valid_utf8(utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [make_valid_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS make_valid_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, make_valid_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS make_valid_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select validate_utf8(utf8_binary), validate_utf8(utf8_lcase) from t1
+-- !query analysis
+Project [validate_utf8(utf8_binary#x) AS validate_utf8(utf8_binary)#x, validate_utf8(utf8_lcase#x) AS validate_utf8(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select validate_utf8(utf8_binary collate utf8_lcase), validate_utf8(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [validate_utf8(collate(utf8_binary#x, utf8_lcase)) AS validate_utf8(collate(utf8_binary, utf8_lcase))#x, validate_utf8(collate(utf8_lcase#x, utf8_binary)) AS validate_utf8(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select validate_utf8(utf8_binary collate utf8_lcase_rtrim), validate_utf8(utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [validate_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS validate_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, validate_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS validate_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select try_validate_utf8(utf8_binary), try_validate_utf8(utf8_lcase) from t1
+-- !query analysis
+Project [try_validate_utf8(utf8_binary#x) AS try_validate_utf8(utf8_binary)#x, try_validate_utf8(utf8_lcase#x) AS try_validate_utf8(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select try_validate_utf8(utf8_binary collate utf8_lcase), try_validate_utf8(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [try_validate_utf8(collate(utf8_binary#x, utf8_lcase)) AS try_validate_utf8(collate(utf8_binary, utf8_lcase))#x, try_validate_utf8(collate(utf8_lcase#x, utf8_binary)) AS try_validate_utf8(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select try_validate_utf8(utf8_binary collate utf8_lcase_rtrim), try_validate_utf8(utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [try_validate_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS try_validate_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, try_validate_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS try_validate_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+drop table t1
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
+
+
+-- !query
+drop table t2
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t2
+
+
+-- !query
+drop table t3
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t3
+
+
+-- !query
+drop table t4
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t4
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/collations-padding-trim.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-padding-trim.sql.out
new file mode 100644
index 0000000000000..626c4e57e14bd
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-padding-trim.sql.out
@@ -0,0 +1,690 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+create table t1(s string, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
+
+
+-- !query
+insert into t1 values ('Spark', 'Spark', 'SQL')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaAAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaAaaAaaAaAaaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('bbAbaAbA', 'bbAbAAbA', 'a')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo ')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo ', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'i̇o')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('efd2', 'efd2', 'efd2')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Hello, world! Nice day.', 'Hello, world! Nice day.', 'Hello, world! Nice day.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Something else. Nothing here.', 'Something else. Nothing here.', 'Something else. Nothing here.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('kitten', 'kitten', 'sitTing')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abc', 'abc', 'abc')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abcdcba', 'abcdcba', 'aBcDCbA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+select rpad(utf8_binary, 8, utf8_lcase) from t1
+-- !query analysis
+Project [rpad(cast(utf8_binary#x as string collate null), 8, cast(utf8_lcase#x as string collate null)) AS rpad(utf8_binary, 8, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select rpad(s, 8, utf8_binary) from t1
+-- !query analysis
+Project [rpad(s#x, 8, utf8_binary#x) AS rpad(s, 8, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select rpad(utf8_binary collate utf8_binary, 8, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select rpad(utf8_binary, 8, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [rpad(utf8_binary#x, 8, collate(utf8_lcase#x, utf8_binary)) AS rpad(utf8_binary, 8, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select rpad(utf8_binary collate utf8_lcase, 8, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [rpad(collate(utf8_binary#x, utf8_lcase), 8, collate(utf8_lcase#x, utf8_lcase)) AS rpad(collate(utf8_binary, utf8_lcase), 8, collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary collate utf8_binary_rtrim, 8, utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [lpad(collate(utf8_binary#x, utf8_binary_rtrim), 8, collate(utf8_lcase#x, utf8_binary_rtrim)) AS lpad(collate(utf8_binary, utf8_binary_rtrim), 8, collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select rpad(utf8_binary, 8, 'a'), rpad(utf8_lcase, 8, 'a') from t1
+-- !query analysis
+Project [rpad(utf8_binary#x, 8, a) AS rpad(utf8_binary, 8, a)#x, rpad(utf8_lcase#x, 8, a) AS rpad(utf8_lcase, 8, 'a' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select rpad(utf8_binary, 8, 'AaAA' collate utf8_lcase), rpad(utf8_lcase, 8, 'AAa' collate utf8_binary) from t1
+-- !query analysis
+Project [rpad(cast(utf8_binary#x as string collate UTF8_LCASE), 8, collate(AaAA, utf8_lcase)) AS rpad(utf8_binary, 8, collate(AaAA, utf8_lcase))#x, rpad(cast(utf8_lcase#x as string), 8, collate(AAa, utf8_binary)) AS rpad(utf8_lcase, 8, collate(AAa, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary, 8, utf8_lcase) from t1
+-- !query analysis
+Project [lpad(cast(utf8_binary#x as string collate null), 8, cast(utf8_lcase#x as string collate null)) AS lpad(utf8_binary, 8, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(s, 8, utf8_binary) from t1
+-- !query analysis
+Project [lpad(s#x, 8, utf8_binary#x) AS lpad(s, 8, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary collate utf8_binary, 8, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select lpad(utf8_binary, 8, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [lpad(utf8_binary#x, 8, collate(utf8_lcase#x, utf8_binary)) AS lpad(utf8_binary, 8, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary collate utf8_lcase, 8, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [lpad(collate(utf8_binary#x, utf8_lcase), 8, collate(utf8_lcase#x, utf8_lcase)) AS lpad(collate(utf8_binary, utf8_lcase), 8, collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary collate utf8_binary_rtrim, 8, utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [lpad(collate(utf8_binary#x, utf8_binary_rtrim), 8, collate(utf8_lcase#x, utf8_binary_rtrim)) AS lpad(collate(utf8_binary, utf8_binary_rtrim), 8, collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary, 8, 'a'), lpad(utf8_lcase, 8, 'a') from t1
+-- !query analysis
+Project [lpad(utf8_binary#x, 8, a) AS lpad(utf8_binary, 8, a)#x, lpad(utf8_lcase#x, 8, a) AS lpad(utf8_lcase, 8, 'a' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lpad(utf8_binary, 8, 'AaAA' collate utf8_lcase), lpad(utf8_lcase, 8, 'AAa' collate utf8_binary) from t1
+-- !query analysis
+Project [lpad(cast(utf8_binary#x as string collate UTF8_LCASE), 8, collate(AaAA, utf8_lcase)) AS lpad(utf8_binary, 8, collate(AaAA, utf8_lcase))#x, lpad(cast(utf8_lcase#x as string), 8, collate(AAa, utf8_binary)) AS lpad(utf8_lcase, 8, collate(AAa, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select TRIM(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"TRIM(BOTH utf8_binary FROM utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 36,
+ "fragment" : "TRIM(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select TRIM(s, utf8_binary) from t1
+-- !query analysis
+Project [trim(utf8_binary#x, Some(s#x)) AS TRIM(BOTH s FROM utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select TRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
+ }
+}
+
+
+-- !query
+select TRIM(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [trim(collate(utf8_lcase#x, utf8_binary), Some(utf8_binary#x)) AS TRIM(BOTH utf8_binary FROM collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select TRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [trim(collate(utf8_lcase#x, utf8_lcase), Some(collate(utf8_binary#x, utf8_lcase))) AS TRIM(BOTH collate(utf8_binary, utf8_lcase) FROM collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select TRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_lcase, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"TRIM(BOTH collate(utf8_binary, unicode_ai) FROM collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 74,
+ "fragment" : "TRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select TRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [trim(collate(utf8_lcase#x, utf8_binary_rtrim), Some(collate(utf8_binary#x, utf8_binary_rtrim))) AS TRIM(BOTH collate(utf8_binary, utf8_binary_rtrim) FROM collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select TRIM('ABc', utf8_binary), TRIM('ABc', utf8_lcase) from t1
+-- !query analysis
+Project [trim(utf8_binary#x, Some(ABc)) AS TRIM(BOTH ABc FROM utf8_binary)#x, trim(utf8_lcase#x, Some(ABc)) AS TRIM(BOTH 'ABc' collate UTF8_LCASE FROM utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select TRIM('ABc' collate utf8_lcase, utf8_binary), TRIM('AAa' collate utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [trim(cast(utf8_binary#x as string collate UTF8_LCASE), Some(collate(ABc, utf8_lcase))) AS TRIM(BOTH collate(ABc, utf8_lcase) FROM utf8_binary)#x, trim(cast(utf8_lcase#x as string), Some(collate(AAa, utf8_binary))) AS TRIM(BOTH collate(AAa, utf8_binary) FROM utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select BTRIM(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"TRIM(BOTH utf8_lcase FROM utf8_binary)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 37,
+ "fragment" : "BTRIM(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select BTRIM(s, utf8_binary) from t1
+-- !query analysis
+Project [btrim(s#x, utf8_binary#x) AS btrim(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select BTRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select BTRIM(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [btrim(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS btrim(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select BTRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [btrim(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS btrim(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select BTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"TRIM(BOTH collate(utf8_lcase, unicode_ai) FROM collate(utf8_binary, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 75,
+ "fragment" : "BTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select BTRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [btrim(collate(utf8_binary#x, utf8_binary_rtrim), collate(utf8_lcase#x, utf8_binary_rtrim)) AS btrim(collate(utf8_binary, utf8_binary_rtrim), collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select BTRIM('ABc', utf8_binary), BTRIM('ABc', utf8_lcase) from t1
+-- !query analysis
+Project [btrim(ABc, utf8_binary#x) AS btrim(ABc, utf8_binary)#x, btrim(ABc, utf8_lcase#x) AS btrim(ABc, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select BTRIM('ABc' collate utf8_lcase, utf8_binary), BTRIM('AAa' collate utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [btrim(collate(ABc, utf8_lcase), utf8_binary#x) AS btrim(collate(ABc, utf8_lcase), utf8_binary)#x, btrim(collate(AAa, utf8_binary), utf8_lcase#x) AS btrim(collate(AAa, utf8_binary), utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select LTRIM(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"TRIM(LEADING utf8_binary FROM utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 37,
+ "fragment" : "LTRIM(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select LTRIM(s, utf8_binary) from t1
+-- !query analysis
+Project [ltrim(utf8_binary#x, Some(s#x)) AS TRIM(LEADING s FROM utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select LTRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
+ }
+}
+
+
+-- !query
+select LTRIM(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [ltrim(collate(utf8_lcase#x, utf8_binary), Some(utf8_binary#x)) AS TRIM(LEADING utf8_binary FROM collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select LTRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [ltrim(collate(utf8_lcase#x, utf8_lcase), Some(collate(utf8_binary#x, utf8_lcase))) AS TRIM(LEADING collate(utf8_binary, utf8_lcase) FROM collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select LTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_lcase, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"TRIM(LEADING collate(utf8_binary, unicode_ai) FROM collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 75,
+ "fragment" : "LTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select LTRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [ltrim(collate(utf8_lcase#x, utf8_binary_rtrim), Some(collate(utf8_binary#x, utf8_binary_rtrim))) AS TRIM(LEADING collate(utf8_binary, utf8_binary_rtrim) FROM collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select LTRIM('ABc', utf8_binary), LTRIM('ABc', utf8_lcase) from t1
+-- !query analysis
+Project [ltrim(utf8_binary#x, Some(ABc)) AS TRIM(LEADING ABc FROM utf8_binary)#x, ltrim(utf8_lcase#x, Some(ABc)) AS TRIM(LEADING 'ABc' collate UTF8_LCASE FROM utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select LTRIM('ABc' collate utf8_lcase, utf8_binary), LTRIM('AAa' collate utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [ltrim(cast(utf8_binary#x as string collate UTF8_LCASE), Some(collate(ABc, utf8_lcase))) AS TRIM(LEADING collate(ABc, utf8_lcase) FROM utf8_binary)#x, ltrim(cast(utf8_lcase#x as string), Some(collate(AAa, utf8_binary))) AS TRIM(LEADING collate(AAa, utf8_binary) FROM utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select RTRIM(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"TRIM(TRAILING utf8_binary FROM utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 37,
+ "fragment" : "RTRIM(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select RTRIM(s, utf8_binary) from t1
+-- !query analysis
+Project [rtrim(utf8_binary#x, Some(s#x)) AS TRIM(TRAILING s FROM utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select RTRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
+ }
+}
+
+
+-- !query
+select RTRIM(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [rtrim(collate(utf8_lcase#x, utf8_binary), Some(utf8_binary#x)) AS TRIM(TRAILING utf8_binary FROM collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select RTRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [rtrim(collate(utf8_lcase#x, utf8_lcase), Some(collate(utf8_binary#x, utf8_lcase))) AS TRIM(TRAILING collate(utf8_binary, utf8_lcase) FROM collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select RTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_lcase, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"TRIM(TRAILING collate(utf8_binary, unicode_ai) FROM collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 75,
+ "fragment" : "RTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select RTRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [rtrim(collate(utf8_lcase#x, utf8_binary_rtrim), Some(collate(utf8_binary#x, utf8_binary_rtrim))) AS TRIM(TRAILING collate(utf8_binary, utf8_binary_rtrim) FROM collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select RTRIM('ABc', utf8_binary), RTRIM('ABc', utf8_lcase) from t1
+-- !query analysis
+Project [rtrim(utf8_binary#x, Some(ABc)) AS TRIM(TRAILING ABc FROM utf8_binary)#x, rtrim(utf8_lcase#x, Some(ABc)) AS TRIM(TRAILING 'ABc' collate UTF8_LCASE FROM utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select RTRIM('ABc' collate utf8_lcase, utf8_binary), RTRIM('AAa' collate utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [rtrim(cast(utf8_binary#x as string collate UTF8_LCASE), Some(collate(ABc, utf8_lcase))) AS TRIM(TRAILING collate(ABc, utf8_lcase) FROM utf8_binary)#x, rtrim(cast(utf8_lcase#x as string), Some(collate(AAa, utf8_binary))) AS TRIM(TRAILING collate(AAa, utf8_binary) FROM utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+drop table t1
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/collations-string-functions.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-string-functions.sql.out
new file mode 100644
index 0000000000000..f7d2d595a5817
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/collations-string-functions.sql.out
@@ -0,0 +1,1510 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+create table t1(s string, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
+
+
+-- !query
+insert into t1 values ('Spark', 'Spark', 'SQL')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaAAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaAaaAaaAaAaaAaaAaA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('bbAbaAbA', 'bbAbAAbA', 'a')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'İo ')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo ', 'İo')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('İo', 'İo', 'i̇o')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('efd2', 'efd2', 'efd2')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Hello, world! Nice day.', 'Hello, world! Nice day.', 'Hello, world! Nice day.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('Something else. Nothing here.', 'Something else. Nothing here.', 'Something else. Nothing here.')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('kitten', 'kitten', 'sitTing')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abc', 'abc', 'abc')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+insert into t1 values ('abcdcba', 'abcdcba', 'aBcDCbA')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [s, utf8_binary, utf8_lcase]
++- Project [col1#x AS s#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+create table t2(ascii long) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t2`, false
+
+
+-- !query
+insert into t2 values (97)
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [ascii]
++- Project [cast(col1#x as bigint) AS ascii#xL]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+insert into t2 values (66)
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [ascii]
++- Project [cast(col1#x as bigint) AS ascii#xL]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+create table t3(format string collate utf8_binary, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
+-- !query analysis
+CreateDataSourceTableCommand `spark_catalog`.`default`.`t3`, false
+
+
+-- !query
+insert into t3 values ('%s%s', 'abCdE', 'abCdE')
+-- !query analysis
+InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [format, utf8_binary, utf8_lcase]
++- Project [col1#x AS format#x, col2#x AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+select concat_ws(' ', utf8_lcase, utf8_lcase) from t1
+-- !query analysis
+Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select concat_ws(' ', utf8_binary, utf8_lcase) from t1
+-- !query analysis
+Project [concat_ws( , cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null)) AS concat_ws(' ' collate null, utf8_binary, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select concat_ws(' ' collate utf8_binary, utf8_binary, 'SQL' collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select concat_ws(' ' collate utf8_lcase, utf8_binary, 'SQL' collate utf8_lcase) from t1
+-- !query analysis
+Project [concat_ws(collate( , utf8_lcase), cast(utf8_binary#x as string collate UTF8_LCASE), collate(SQL, utf8_lcase)) AS concat_ws(collate( , utf8_lcase), utf8_binary, collate(SQL, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select concat_ws(',', utf8_lcase, 'word'), concat_ws(',', utf8_binary, 'word') from t1
+-- !query analysis
+Project [concat_ws(,, utf8_lcase#x, word) AS concat_ws(',' collate UTF8_LCASE, utf8_lcase, 'word' collate UTF8_LCASE)#x, concat_ws(,, utf8_binary#x, word) AS concat_ws(,, utf8_binary, word)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select concat_ws(',', utf8_lcase, 'word' collate utf8_binary), concat_ws(',', utf8_binary, 'word' collate utf8_lcase) from t1
+-- !query analysis
+Project [concat_ws(,, cast(utf8_lcase#x as string), collate(word, utf8_binary)) AS concat_ws(,, utf8_lcase, collate(word, utf8_binary))#x, concat_ws(,, cast(utf8_binary#x as string collate UTF8_LCASE), collate(word, utf8_lcase)) AS concat_ws(',' collate UTF8_LCASE, utf8_binary, collate(word, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(utf8_binary, utf8_lcase, 3) from t1
+-- !query analysis
+Project [split_part(cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), 3) AS split_part(utf8_binary, utf8_lcase, 3)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(s, utf8_binary, 1) from t1
+-- !query analysis
+Project [split_part(s#x, utf8_binary#x, 1) AS split_part(s, utf8_binary, 1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(utf8_binary collate utf8_binary, s collate utf8_lcase, 1) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select split_part(utf8_binary, utf8_lcase collate utf8_binary, 2) from t1
+-- !query analysis
+Project [split_part(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 2) AS split_part(utf8_binary, collate(utf8_lcase, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 2) from t1
+-- !query analysis
+Project [split_part(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 2) AS split_part(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"split_part(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 2)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 83,
+ "fragment" : "split_part(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2)"
+ } ]
+}
+
+
+-- !query
+select split_part(utf8_binary, 'a', 3), split_part(utf8_lcase, 'a', 3) from t1
+-- !query analysis
+Project [split_part(utf8_binary#x, a, 3) AS split_part(utf8_binary, a, 3)#x, split_part(utf8_lcase#x, a, 3) AS split_part(utf8_lcase, 'a' collate UTF8_LCASE, 3)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(utf8_binary, 'a' collate utf8_lcase, 3), split_part(utf8_lcase, 'a' collate utf8_binary, 3) from t1
+-- !query analysis
+Project [split_part(cast(utf8_binary#x as string collate UTF8_LCASE), collate(a, utf8_lcase), 3) AS split_part(utf8_binary, collate(a, utf8_lcase), 3)#x, split_part(cast(utf8_lcase#x as string), collate(a, utf8_binary), 3) AS split_part(utf8_lcase, collate(a, utf8_binary), 3)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select split_part(utf8_binary, 'a ' collate utf8_lcase_rtrim, 3), split_part(utf8_lcase, 'a' collate utf8_binary, 3) from t1
+-- !query analysis
+Project [split_part(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(a , utf8_lcase_rtrim), 3) AS split_part(utf8_binary, collate(a , utf8_lcase_rtrim), 3)#x, split_part(cast(utf8_lcase#x as string), collate(a, utf8_binary), 3) AS split_part(utf8_lcase, collate(a, utf8_binary), 3)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select contains(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"contains(utf8_binary, utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 40,
+ "fragment" : "contains(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select contains(s, utf8_binary) from t1
+-- !query analysis
+Project [Contains(s#x, utf8_binary#x) AS contains(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select contains(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select contains(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [Contains(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS contains(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select contains(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [Contains(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS contains(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select contains(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"contains(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 78,
+ "fragment" : "contains(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select contains(utf8_binary, 'a'), contains(utf8_lcase, 'a') from t1
+-- !query analysis
+Project [Contains(utf8_binary#x, a) AS contains(utf8_binary, a)#x, Contains(utf8_lcase#x, a) AS contains(utf8_lcase, 'a' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select contains(utf8_binary, 'AaAA' collate utf8_lcase), contains(utf8_lcase, 'AAa' collate utf8_binary) from t1
+-- !query analysis
+Project [Contains(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase)) AS contains(utf8_binary, collate(AaAA, utf8_lcase))#x, Contains(cast(utf8_lcase#x as string), collate(AAa, utf8_binary)) AS contains(utf8_lcase, collate(AAa, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select contains(utf8_binary, 'AaAA ' collate utf8_lcase_rtrim), contains(utf8_lcase, 'AAa ' collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [Contains(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(AaAA , utf8_lcase_rtrim)) AS contains(utf8_binary, collate(AaAA , utf8_lcase_rtrim))#x, Contains(cast(utf8_lcase#x as string collate UTF8_BINARY_RTRIM), collate(AAa , utf8_binary_rtrim)) AS contains(utf8_lcase, collate(AAa , utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substring_index(utf8_binary, utf8_lcase, 2) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"substring_index(utf8_binary, utf8_lcase, 2)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "substring_index(utf8_binary, utf8_lcase, 2)"
+ } ]
+}
+
+
+-- !query
+select substring_index(s, utf8_binary,1) from t1
+-- !query analysis
+Project [substring_index(s#x, utf8_binary#x, 1) AS substring_index(s, utf8_binary, 1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substring_index(utf8_binary collate utf8_binary, s collate utf8_lcase, 3) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select substring_index(utf8_binary, utf8_lcase collate utf8_binary, 2) from t1
+-- !query analysis
+Project [substring_index(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 2) AS substring_index(utf8_binary, collate(utf8_lcase, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substring_index(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 2) from t1
+-- !query analysis
+Project [substring_index(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 2) AS substring_index(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substring_index(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"substring_index(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 2)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 88,
+ "fragment" : "substring_index(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2)"
+ } ]
+}
+
+
+-- !query
+select substring_index(utf8_binary, 'a', 2), substring_index(utf8_lcase, 'a', 2) from t1
+-- !query analysis
+Project [substring_index(utf8_binary#x, a, 2) AS substring_index(utf8_binary, a, 2)#x, substring_index(utf8_lcase#x, a, 2) AS substring_index(utf8_lcase, 'a' collate UTF8_LCASE, 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substring_index(utf8_binary, 'AaAA' collate utf8_lcase, 2), substring_index(utf8_lcase, 'AAa' collate utf8_binary, 2) from t1
+-- !query analysis
+Project [substring_index(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), 2) AS substring_index(utf8_binary, collate(AaAA, utf8_lcase), 2)#x, substring_index(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 2) AS substring_index(utf8_lcase, collate(AAa, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substring_index(utf8_binary, 'AaAA ' collate utf8_lcase_rtrim, 2), substring_index(utf8_lcase, 'AAa' collate utf8_binary, 2) from t1
+-- !query analysis
+Project [substring_index(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(AaAA , utf8_lcase_rtrim), 2) AS substring_index(utf8_binary, collate(AaAA , utf8_lcase_rtrim), 2)#x, substring_index(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 2) AS substring_index(utf8_lcase, collate(AAa, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select instr(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"instr(utf8_binary, utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 37,
+ "fragment" : "instr(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select instr(s, utf8_binary) from t1
+-- !query analysis
+Project [instr(s#x, utf8_binary#x) AS instr(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select instr(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select instr(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [instr(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS instr(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select instr(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [instr(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS instr(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select instr(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"instr(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 75,
+ "fragment" : "instr(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select instr(utf8_binary, 'a'), instr(utf8_lcase, 'a') from t1
+-- !query analysis
+Project [instr(utf8_binary#x, a) AS instr(utf8_binary, a)#x, instr(utf8_lcase#x, a) AS instr(utf8_lcase, 'a' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select instr(utf8_binary, 'AaAA' collate utf8_lcase), instr(utf8_lcase, 'AAa' collate utf8_binary) from t1
+-- !query analysis
+Project [instr(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase)) AS instr(utf8_binary, collate(AaAA, utf8_lcase))#x, instr(cast(utf8_lcase#x as string), collate(AAa, utf8_binary)) AS instr(utf8_lcase, collate(AAa, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select find_in_set(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"find_in_set(utf8_binary, utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 43,
+ "fragment" : "find_in_set(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select find_in_set(s, utf8_binary) from t1
+-- !query analysis
+Project [find_in_set(s#x, utf8_binary#x) AS find_in_set(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select find_in_set(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select find_in_set(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [find_in_set(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS find_in_set(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select find_in_set(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [find_in_set(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS find_in_set(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select find_in_set(utf8_binary, 'aaAaaAaA,i̇o'), find_in_set(utf8_lcase, 'aaAaaAaA,i̇o') from t1
+-- !query analysis
+Project [find_in_set(utf8_binary#x, aaAaaAaA,i̇o) AS find_in_set(utf8_binary, aaAaaAaA,i̇o)#x, find_in_set(utf8_lcase#x, aaAaaAaA,i̇o) AS find_in_set(utf8_lcase, 'aaAaaAaA,i̇o' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select find_in_set(utf8_binary, 'aaAaaAaA,i̇o' collate utf8_lcase), find_in_set(utf8_lcase, 'aaAaaAaA,i̇o' collate utf8_binary) from t1
+-- !query analysis
+Project [find_in_set(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA,i̇o, utf8_lcase)) AS find_in_set(utf8_binary, collate(aaAaaAaA,i̇o, utf8_lcase))#x, find_in_set(cast(utf8_lcase#x as string), collate(aaAaaAaA,i̇o, utf8_binary)) AS find_in_set(utf8_lcase, collate(aaAaaAaA,i̇o, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select find_in_set(utf8_binary, 'aaAaaAaA,i̇o ' collate utf8_lcase_rtrim), find_in_set(utf8_lcase, 'aaAaaAaA,i̇o' collate utf8_binary) from t1
+-- !query analysis
+Project [find_in_set(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA,i̇o , utf8_lcase_rtrim)) AS find_in_set(utf8_binary, collate(aaAaaAaA,i̇o , utf8_lcase_rtrim))#x, find_in_set(cast(utf8_lcase#x as string), collate(aaAaaAaA,i̇o, utf8_binary)) AS find_in_set(utf8_lcase, collate(aaAaaAaA,i̇o, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select startswith(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"startswith(utf8_binary, utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 42,
+ "fragment" : "startswith(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select startswith(s, utf8_binary) from t1
+-- !query analysis
+Project [StartsWith(s#x, utf8_binary#x) AS startswith(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select startswith(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select startswith(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [StartsWith(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS startswith(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select startswith(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [StartsWith(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS startswith(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select startswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"startswith(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 80,
+ "fragment" : "startswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select startswith(utf8_binary, 'aaAaaAaA'), startswith(utf8_lcase, 'aaAaaAaA') from t1
+-- !query analysis
+Project [StartsWith(utf8_binary#x, aaAaaAaA) AS startswith(utf8_binary, aaAaaAaA)#x, StartsWith(utf8_lcase#x, aaAaaAaA) AS startswith(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select startswith(utf8_binary, 'aaAaaAaA' collate utf8_lcase), startswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t1
+-- !query analysis
+Project [StartsWith(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA, utf8_lcase)) AS startswith(utf8_binary, collate(aaAaaAaA, utf8_lcase))#x, StartsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS startswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select startswith(utf8_binary, 'aaAaaAaA ' collate utf8_lcase_rtrim), startswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t1
+-- !query analysis
+Project [StartsWith(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA , utf8_lcase_rtrim)) AS startswith(utf8_binary, collate(aaAaaAaA , utf8_lcase_rtrim))#x, StartsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS startswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select translate(utf8_lcase, utf8_lcase, '12345') from t1
+-- !query analysis
+Project [translate(utf8_lcase#x, utf8_lcase#x, 12345) AS translate(utf8_lcase, utf8_lcase, '12345' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select translate(utf8_binary, utf8_lcase, '12345') from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"translate(utf8_binary, utf8_lcase, 12345)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "translate(utf8_binary, utf8_lcase, '12345')"
+ } ]
+}
+
+
+-- !query
+select translate(utf8_binary, 'aBc' collate utf8_lcase, '12345' collate utf8_binary) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
+ }
+}
+
+
+-- !query
+select translate(utf8_binary, 'SQL' collate utf8_lcase, '12345' collate utf8_lcase) from t1
+-- !query analysis
+Project [translate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(SQL, utf8_lcase), collate(12345, utf8_lcase)) AS translate(utf8_binary, collate(SQL, utf8_lcase), collate(12345, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select translate(utf8_binary, 'SQL' collate unicode_ai, '12345' collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"utf8_binary\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"translate(utf8_binary, collate(SQL, unicode_ai), collate(12345, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 83,
+ "fragment" : "translate(utf8_binary, 'SQL' collate unicode_ai, '12345' collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select translate(utf8_lcase, 'aaAaaAaA', '12345'), translate(utf8_binary, 'aaAaaAaA', '12345') from t1
+-- !query analysis
+Project [translate(utf8_lcase#x, aaAaaAaA, 12345) AS translate(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE, '12345' collate UTF8_LCASE)#x, translate(utf8_binary#x, aaAaaAaA, 12345) AS translate(utf8_binary, aaAaaAaA, 12345)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select translate(utf8_lcase, 'aBc' collate utf8_binary, '12345'), translate(utf8_binary, 'aBc' collate utf8_lcase, '12345') from t1
+-- !query analysis
+Project [translate(cast(utf8_lcase#x as string), collate(aBc, utf8_binary), 12345) AS translate(utf8_lcase, collate(aBc, utf8_binary), 12345)#x, translate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aBc, utf8_lcase), 12345) AS translate(utf8_binary, collate(aBc, utf8_lcase), '12345' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select translate(utf8_lcase, 'aBc ' collate utf8_binary_rtrim, '12345'), translate(utf8_binary, 'aBc' collate utf8_lcase, '12345') from t1
+-- !query analysis
+Project [translate(cast(utf8_lcase#x as string collate UTF8_BINARY_RTRIM), collate(aBc , utf8_binary_rtrim), 12345) AS translate(utf8_lcase, collate(aBc , utf8_binary_rtrim), '12345' collate UTF8_BINARY_RTRIM)#x, translate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aBc, utf8_lcase), 12345) AS translate(utf8_binary, collate(aBc, utf8_lcase), '12345' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select replace(utf8_binary, utf8_lcase, 'abc') from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"replace(utf8_binary, utf8_lcase, abc)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 46,
+ "fragment" : "replace(utf8_binary, utf8_lcase, 'abc')"
+ } ]
+}
+
+
+-- !query
+select replace(s, utf8_binary, 'abc') from t1
+-- !query analysis
+Project [replace(s#x, utf8_binary#x, abc) AS replace(s, utf8_binary, abc)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select replace(utf8_binary collate utf8_binary, s collate utf8_lcase, 'abc') from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select replace(utf8_binary, utf8_lcase collate utf8_binary, 'abc') from t1
+-- !query analysis
+Project [replace(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), abc) AS replace(utf8_binary, collate(utf8_lcase, utf8_binary), abc)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select replace(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 'abc') from t1
+-- !query analysis
+Project [replace(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), abc) AS replace(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 'abc' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select replace(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 'abc') from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"replace(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 'abc' collate UNICODE_AI)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 84,
+ "fragment" : "replace(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 'abc')"
+ } ]
+}
+
+
+-- !query
+select replace(utf8_binary, 'aaAaaAaA', 'abc'), replace(utf8_lcase, 'aaAaaAaA', 'abc') from t1
+-- !query analysis
+Project [replace(utf8_binary#x, aaAaaAaA, abc) AS replace(utf8_binary, aaAaaAaA, abc)#x, replace(utf8_lcase#x, aaAaaAaA, abc) AS replace(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE, 'abc' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select replace(utf8_binary, 'aaAaaAaA' collate utf8_lcase, 'abc'), replace(utf8_lcase, 'aaAaaAaA' collate utf8_binary, 'abc') from t1
+-- !query analysis
+Project [replace(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA, utf8_lcase), abc) AS replace(utf8_binary, collate(aaAaaAaA, utf8_lcase), 'abc' collate UTF8_LCASE)#x, replace(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary), abc) AS replace(utf8_lcase, collate(aaAaaAaA, utf8_binary), abc)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select replace(utf8_binary, 'aaAaaAaA ' collate utf8_lcase_rtrim, 'abc'), replace(utf8_lcase, 'aaAaaAaA' collate utf8_binary, 'abc') from t1
+-- !query analysis
+Project [replace(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA , utf8_lcase_rtrim), abc) AS replace(utf8_binary, collate(aaAaaAaA , utf8_lcase_rtrim), 'abc' collate UTF8_LCASE_RTRIM)#x, replace(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary), abc) AS replace(utf8_lcase, collate(aaAaaAaA, utf8_binary), abc)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select endswith(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"endswith(utf8_binary, utf8_lcase)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 40,
+ "fragment" : "endswith(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select endswith(s, utf8_binary) from t1
+-- !query analysis
+Project [EndsWith(s#x, utf8_binary#x) AS endswith(s, utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select endswith(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select endswith(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [EndsWith(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS endswith(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select endswith(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t1
+-- !query analysis
+Project [EndsWith(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS endswith(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select endswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"endswith(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 78,
+ "fragment" : "endswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
+ } ]
+}
+
+
+-- !query
+select endswith(utf8_binary, 'aaAaaAaA'), endswith(utf8_lcase, 'aaAaaAaA') from t1
+-- !query analysis
+Project [EndsWith(utf8_binary#x, aaAaaAaA) AS endswith(utf8_binary, aaAaaAaA)#x, EndsWith(utf8_lcase#x, aaAaaAaA) AS endswith(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select endswith(utf8_binary, 'aaAaaAaA' collate utf8_lcase), endswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t1
+-- !query analysis
+Project [EndsWith(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA, utf8_lcase)) AS endswith(utf8_binary, collate(aaAaaAaA, utf8_lcase))#x, EndsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS endswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select endswith(utf8_binary, 'aaAaaAaA ' collate utf8_lcase_rtrim), endswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t1
+-- !query analysis
+Project [EndsWith(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA , utf8_lcase_rtrim)) AS endswith(utf8_binary, collate(aaAaaAaA , utf8_lcase_rtrim))#x, EndsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS endswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select repeat(utf8_binary, 3), repeat(utf8_lcase, 2) from t1
+-- !query analysis
+Project [repeat(utf8_binary#x, 3) AS repeat(utf8_binary, 3)#x, repeat(utf8_lcase#x, 2) AS repeat(utf8_lcase, 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select repeat(utf8_binary collate utf8_lcase, 3), repeat(utf8_lcase collate utf8_binary, 2) from t1
+-- !query analysis
+Project [repeat(collate(utf8_binary#x, utf8_lcase), 3) AS repeat(collate(utf8_binary, utf8_lcase), 3)#x, repeat(collate(utf8_lcase#x, utf8_binary), 2) AS repeat(collate(utf8_lcase, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select chr(ascii) from t2
+-- !query analysis
+Project [chr(ascii#xL) AS chr(ascii)#x]
++- SubqueryAlias spark_catalog.default.t2
+ +- Relation spark_catalog.default.t2[ascii#xL] parquet
+
+
+-- !query
+select sentences(utf8_binary), sentences(utf8_lcase) from t1
+-- !query analysis
+Project [sentences(utf8_binary#x, , ) AS sentences(utf8_binary, , )#x, sentences(utf8_lcase#x, , ) AS sentences(utf8_lcase, , )#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select sentences(utf8_binary collate utf8_lcase), sentences(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [sentences(collate(utf8_binary#x, utf8_lcase), , ) AS sentences(collate(utf8_binary, utf8_lcase), , )#x, sentences(collate(utf8_lcase#x, utf8_binary), , ) AS sentences(collate(utf8_lcase, utf8_binary), , )#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select upper(utf8_binary), upper(utf8_lcase) from t1
+-- !query analysis
+Project [upper(utf8_binary#x) AS upper(utf8_binary)#x, upper(utf8_lcase#x) AS upper(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select upper(utf8_binary collate utf8_lcase), upper(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [upper(collate(utf8_binary#x, utf8_lcase)) AS upper(collate(utf8_binary, utf8_lcase))#x, upper(collate(utf8_lcase#x, utf8_binary)) AS upper(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lower(utf8_binary), lower(utf8_lcase) from t1
+-- !query analysis
+Project [lower(utf8_binary#x) AS lower(utf8_binary)#x, lower(utf8_lcase#x) AS lower(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select lower(utf8_binary collate utf8_lcase), lower(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [lower(collate(utf8_binary#x, utf8_lcase)) AS lower(collate(utf8_binary, utf8_lcase))#x, lower(collate(utf8_lcase#x, utf8_binary)) AS lower(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select initcap(utf8_binary), initcap(utf8_lcase) from t1
+-- !query analysis
+Project [initcap(utf8_binary#x) AS initcap(utf8_binary)#x, initcap(utf8_lcase#x) AS initcap(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select initcap(utf8_binary collate utf8_lcase), initcap(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [initcap(collate(utf8_binary#x, utf8_lcase)) AS initcap(collate(utf8_binary, utf8_lcase))#x, initcap(collate(utf8_lcase#x, utf8_binary)) AS initcap(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select overlay(utf8_binary, utf8_lcase, 2) from t1
+-- !query analysis
+Project [overlay(cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), 2, -1) AS overlay(utf8_binary, utf8_lcase, 2, -1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select overlay(s, utf8_binary,1) from t1
+-- !query analysis
+Project [overlay(s#x, utf8_binary#x, 1, -1) AS overlay(s, utf8_binary, 1, -1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select overlay(utf8_binary collate utf8_binary, s collate utf8_lcase, 3) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select overlay(utf8_binary, utf8_lcase collate utf8_binary, 2) from t1
+-- !query analysis
+Project [overlay(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 2, -1) AS overlay(utf8_binary, collate(utf8_lcase, utf8_binary), 2, -1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select overlay(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 2) from t1
+-- !query analysis
+Project [overlay(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 2, -1) AS overlay(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 2, -1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select overlay(utf8_binary, 'a', 2), overlay(utf8_lcase, 'a', 2) from t1
+-- !query analysis
+Project [overlay(utf8_binary#x, a, 2, -1) AS overlay(utf8_binary, a, 2, -1)#x, overlay(utf8_lcase#x, a, 2, -1) AS overlay(utf8_lcase, 'a' collate UTF8_LCASE, 2, -1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select overlay(utf8_binary, 'AaAA' collate utf8_lcase, 2), overlay(utf8_lcase, 'AAa' collate utf8_binary, 2) from t1
+-- !query analysis
+Project [overlay(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), 2, -1) AS overlay(utf8_binary, collate(AaAA, utf8_lcase), 2, -1)#x, overlay(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 2, -1) AS overlay(utf8_lcase, collate(AAa, utf8_binary), 2, -1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select format_string(format, utf8_binary, utf8_lcase) from t3
+-- !query analysis
+Project [format_string(format#x, utf8_binary#x, utf8_lcase#x) AS format_string(format, utf8_binary, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[format#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select format_string(format collate utf8_lcase, utf8_lcase, utf8_binary collate utf8_lcase, 3), format_string(format, utf8_lcase collate utf8_binary, utf8_binary) from t3
+-- !query analysis
+Project [format_string(collate(format#x, utf8_lcase), utf8_lcase#x, collate(utf8_binary#x, utf8_lcase), 3) AS format_string(collate(format, utf8_lcase), utf8_lcase, collate(utf8_binary, utf8_lcase), 3)#x, format_string(format#x, collate(utf8_lcase#x, utf8_binary), utf8_binary#x) AS format_string(format, collate(utf8_lcase, utf8_binary), utf8_binary)#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[format#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select format_string(format, utf8_binary, utf8_lcase) from t3
+-- !query analysis
+Project [format_string(format#x, utf8_binary#x, utf8_lcase#x) AS format_string(format, utf8_binary, utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t3
+ +- Relation spark_catalog.default.t3[format#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select length(utf8_binary), length(utf8_lcase) from t1
+-- !query analysis
+Project [length(utf8_binary#x) AS length(utf8_binary)#x, length(utf8_lcase#x) AS length(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select length(utf8_binary collate utf8_lcase), length(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [length(collate(utf8_binary#x, utf8_lcase)) AS length(collate(utf8_binary, utf8_lcase))#x, length(collate(utf8_lcase#x, utf8_binary)) AS length(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select bit_length(utf8_binary), bit_length(utf8_lcase) from t1
+-- !query analysis
+Project [bit_length(utf8_binary#x) AS bit_length(utf8_binary)#x, bit_length(utf8_lcase#x) AS bit_length(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select bit_length(utf8_binary collate utf8_lcase), bit_length(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [bit_length(collate(utf8_binary#x, utf8_lcase)) AS bit_length(collate(utf8_binary, utf8_lcase))#x, bit_length(collate(utf8_lcase#x, utf8_binary)) AS bit_length(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select octet_length(utf8_binary), octet_length(utf8_lcase) from t1
+-- !query analysis
+Project [octet_length(utf8_binary#x) AS octet_length(utf8_binary)#x, octet_length(utf8_lcase#x) AS octet_length(utf8_lcase)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select octet_length(utf8_binary collate utf8_lcase), octet_length(utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [octet_length(collate(utf8_binary#x, utf8_lcase)) AS octet_length(collate(utf8_binary, utf8_lcase))#x, octet_length(collate(utf8_lcase#x, utf8_binary)) AS octet_length(collate(utf8_lcase, utf8_binary))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select octet_length(utf8_binary collate utf8_lcase_rtrim), octet_length(utf8_lcase collate utf8_binary_rtrim) from t1
+-- !query analysis
+Project [octet_length(collate(utf8_binary#x, utf8_lcase_rtrim)) AS octet_length(collate(utf8_binary, utf8_lcase_rtrim))#x, octet_length(collate(utf8_lcase#x, utf8_binary_rtrim)) AS octet_length(collate(utf8_lcase, utf8_binary_rtrim))#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substr(utf8_binary, 2, 2), substr(utf8_lcase, 2, 2) from t1
+-- !query analysis
+Project [substr(utf8_binary#x, 2, 2) AS substr(utf8_binary, 2, 2)#x, substr(utf8_lcase#x, 2, 2) AS substr(utf8_lcase, 2, 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select substr(utf8_binary collate utf8_lcase, 2, 2), substr(utf8_lcase collate utf8_binary, 2, 2) from t1
+-- !query analysis
+Project [substr(collate(utf8_binary#x, utf8_lcase), 2, 2) AS substr(collate(utf8_binary, utf8_lcase), 2, 2)#x, substr(collate(utf8_lcase#x, utf8_binary), 2, 2) AS substr(collate(utf8_lcase, utf8_binary), 2, 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select right(utf8_binary, 2), right(utf8_lcase, 2) from t1
+-- !query analysis
+Project [right(utf8_binary#x, 2) AS right(utf8_binary, 2)#x, right(utf8_lcase#x, 2) AS right(utf8_lcase, 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select right(utf8_binary collate utf8_lcase, 2), right(utf8_lcase collate utf8_binary, 2) from t1
+-- !query analysis
+Project [right(collate(utf8_binary#x, utf8_lcase), 2) AS right(collate(utf8_binary, utf8_lcase), 2)#x, right(collate(utf8_lcase#x, utf8_binary), 2) AS right(collate(utf8_lcase, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select left(utf8_binary, '2' collate utf8_lcase), left(utf8_lcase, 2) from t1
+-- !query analysis
+Project [left(utf8_binary#x, cast(collate(2, utf8_lcase) as int)) AS left(utf8_binary, collate(2, utf8_lcase))#x, left(utf8_lcase#x, 2) AS left(utf8_lcase, 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select left(utf8_binary collate utf8_lcase, 2), left(utf8_lcase collate utf8_binary, 2) from t1
+-- !query analysis
+Project [left(collate(utf8_binary#x, utf8_lcase), 2) AS left(collate(utf8_binary, utf8_lcase), 2)#x, left(collate(utf8_lcase#x, utf8_binary), 2) AS left(collate(utf8_lcase, utf8_binary), 2)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select locate(utf8_binary, utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
+ "sqlState" : "42P22",
+ "messageParameters" : {
+ "expr" : "\"locate(utf8_binary, utf8_lcase, 1)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 38,
+ "fragment" : "locate(utf8_binary, utf8_lcase)"
+ } ]
+}
+
+
+-- !query
+select locate(s, utf8_binary) from t1
+-- !query analysis
+Project [locate(s#x, utf8_binary#x, 1) AS locate(s, utf8_binary, 1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select locate(utf8_binary collate utf8_binary, s collate utf8_lcase) from t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
+ "sqlState" : "42P21",
+ "messageParameters" : {
+ "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
+ }
+}
+
+
+-- !query
+select locate(utf8_binary, utf8_lcase collate utf8_binary) from t1
+-- !query analysis
+Project [locate(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 1) AS locate(utf8_binary, collate(utf8_lcase, utf8_binary), 1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select locate(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 3) from t1
+-- !query analysis
+Project [locate(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 3) AS locate(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 3)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select locate(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 3) from t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
+ "inputType" : "\"STRING COLLATE UNICODE_AI\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"STRING\"",
+ "sqlExpr" : "\"locate(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 3)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 79,
+ "fragment" : "locate(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 3)"
+ } ]
+}
+
+
+-- !query
+select locate(utf8_binary, 'a'), locate(utf8_lcase, 'a') from t1
+-- !query analysis
+Project [locate(utf8_binary#x, a, 1) AS locate(utf8_binary, a, 1)#x, locate(utf8_lcase#x, a, 1) AS locate(utf8_lcase, 'a' collate UTF8_LCASE, 1)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select locate(utf8_binary, 'AaAA' collate utf8_lcase, 4), locate(utf8_lcase, 'AAa' collate utf8_binary, 4) from t1
+-- !query analysis
+Project [locate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), 4) AS locate(utf8_binary, collate(AaAA, utf8_lcase), 4)#x, locate(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 4) AS locate(utf8_lcase, collate(AAa, utf8_binary), 4)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+select locate(utf8_binary, 'AaAA ' collate utf8_binary_rtrim, 4), locate(utf8_lcase, 'AAa ' collate utf8_binary, 4) from t1
+-- !query analysis
+Project [locate(cast(utf8_binary#x as string collate UTF8_BINARY_RTRIM), collate(AaAA , utf8_binary_rtrim), 4) AS locate(utf8_binary, collate(AaAA , utf8_binary_rtrim), 4)#x, locate(cast(utf8_lcase#x as string), collate(AAa , utf8_binary), 4) AS locate(utf8_lcase, collate(AAa , utf8_binary), 4)#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- Relation spark_catalog.default.t1[s#x,utf8_binary#x,utf8_lcase#x] parquet
+
+
+-- !query
+drop table t1
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
+
+
+-- !query
+drop table t2
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t2
+
+
+-- !query
+drop table t3
+-- !query analysis
+DropTable false, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t3
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/collations.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/collations.sql.out
deleted file mode 100644
index 957bcabb078fe..0000000000000
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/collations.sql.out
+++ /dev/null
@@ -1,3303 +0,0 @@
--- Automatically generated by SQLQueryTestSuite
--- !query
-create table t1(utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
-
-
--- !query
-insert into t1 values('aaa', 'aaa')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-insert into t1 values('AAA', 'AAA')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-insert into t1 values('bbb', 'bbb')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-insert into t1 values('BBB', 'BBB')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-describe table t1
--- !query analysis
-DescribeTableCommand `spark_catalog`.`default`.`t1`, false, [col_name#x, data_type#x, comment#x]
-
-
--- !query
-select count(*) from t1 group by utf8_binary
--- !query analysis
-Aggregate [utf8_binary#x], [count(1) AS count(1)#xL]
-+- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select count(*) from t1 group by utf8_lcase
--- !query analysis
-Aggregate [utf8_lcase#x], [count(1) AS count(1)#xL]
-+- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select * from t1 where utf8_binary = 'aaa'
--- !query analysis
-Project [utf8_binary#x, utf8_lcase#x]
-+- Filter (utf8_binary#x = aaa)
- +- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select * from t1 where utf8_lcase = 'aaa' collate utf8_lcase
--- !query analysis
-Project [utf8_binary#x, utf8_lcase#x]
-+- Filter (utf8_lcase#x = collate(aaa, utf8_lcase))
- +- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select * from t1 where utf8_binary < 'bbb'
--- !query analysis
-Project [utf8_binary#x, utf8_lcase#x]
-+- Filter (utf8_binary#x < bbb)
- +- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select * from t1 where utf8_lcase < 'bbb' collate utf8_lcase
--- !query analysis
-Project [utf8_binary#x, utf8_lcase#x]
-+- Filter (utf8_lcase#x < collate(bbb, utf8_lcase))
- +- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select l.utf8_binary, r.utf8_lcase from t1 l join t1 r on l.utf8_lcase = r.utf8_lcase
--- !query analysis
-Project [utf8_binary#x, utf8_lcase#x]
-+- Join Inner, (utf8_lcase#x = utf8_lcase#x)
- :- SubqueryAlias l
- : +- SubqueryAlias spark_catalog.default.t1
- : +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
- +- SubqueryAlias r
- +- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-create table t2(utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t2`, false
-
-
--- !query
-insert into t2 values('aaa', 'aaa')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-insert into t2 values('bbb', 'bbb')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-select * from t1 anti join t2 on t1.utf8_lcase = t2.utf8_lcase
--- !query analysis
-Project [utf8_binary#x, utf8_lcase#x]
-+- Join LeftAnti, (utf8_lcase#x = utf8_lcase#x)
- :- SubqueryAlias spark_catalog.default.t1
- : +- Relation spark_catalog.default.t1[utf8_binary#x,utf8_lcase#x] parquet
- +- SubqueryAlias spark_catalog.default.t2
- +- Relation spark_catalog.default.t2[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-drop table t2
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t2
-
-
--- !query
-drop table t1
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except select col1 collate utf8_lcase from values ('aaa'), ('bbb')
--- !query analysis
-Except false
-:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
-: +- LocalRelation [col1#x]
-+- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except all select col1 collate utf8_lcase from values ('aaa'), ('bbb')
--- !query analysis
-Except All true
-:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
-: +- LocalRelation [col1#x]
-+- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union select col1 collate utf8_lcase from values ('aaa'), ('bbb')
--- !query analysis
-Distinct
-+- Union false, false
- :- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
- : +- LocalRelation [col1#x]
- +- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union all select col1 collate utf8_lcase from values ('aaa'), ('bbb')
--- !query analysis
-Union false, false
-:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
-: +- LocalRelation [col1#x]
-+- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') intersect select col1 collate utf8_lcase from values ('aaa'), ('bbb')
--- !query analysis
-Intersect false
-:- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
-: +- LocalRelation [col1#x]
-+- Project [collate(col1#x, utf8_lcase) AS collate(col1, utf8_lcase)#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except select col1 collate unicode_ci from values ('aaa'), ('bbb')
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
- "sqlState" : "42825",
- "messageParameters" : {
- "columnOrdinalNumber" : "first",
- "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
- "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
- "hint" : "",
- "operator" : "EXCEPT",
- "tableOrdinalNumber" : "second"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 1,
- "stopIndex" : 162,
- "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except select col1 collate unicode_ci from values ('aaa'), ('bbb')"
- } ]
-}
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except all select col1 collate unicode_ci from values ('aaa'), ('bbb')
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
- "sqlState" : "42825",
- "messageParameters" : {
- "columnOrdinalNumber" : "first",
- "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
- "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
- "hint" : "",
- "operator" : "EXCEPT ALL",
- "tableOrdinalNumber" : "second"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 1,
- "stopIndex" : 166,
- "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') except all select col1 collate unicode_ci from values ('aaa'), ('bbb')"
- } ]
-}
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union select col1 collate unicode_ci from values ('aaa'), ('bbb')
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
- "sqlState" : "42825",
- "messageParameters" : {
- "columnOrdinalNumber" : "first",
- "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
- "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
- "hint" : "",
- "operator" : "UNION",
- "tableOrdinalNumber" : "second"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 1,
- "stopIndex" : 161,
- "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union select col1 collate unicode_ci from values ('aaa'), ('bbb')"
- } ]
-}
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union all select col1 collate unicode_ci from values ('aaa'), ('bbb')
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
- "sqlState" : "42825",
- "messageParameters" : {
- "columnOrdinalNumber" : "first",
- "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
- "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
- "hint" : "",
- "operator" : "UNION",
- "tableOrdinalNumber" : "second"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 1,
- "stopIndex" : 165,
- "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('AAA'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') union all select col1 collate unicode_ci from values ('aaa'), ('bbb')"
- } ]
-}
-
-
--- !query
-select col1 collate utf8_lcase from values ('aaa'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') intersect select col1 collate unicode_ci from values ('aaa'), ('bbb')
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "INCOMPATIBLE_COLUMN_TYPE",
- "sqlState" : "42825",
- "messageParameters" : {
- "columnOrdinalNumber" : "first",
- "dataType1" : "\"STRING COLLATE UNICODE_CI\"",
- "dataType2" : "\"STRING COLLATE UTF8_LCASE\"",
- "hint" : "",
- "operator" : "INTERSECT",
- "tableOrdinalNumber" : "second"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 1,
- "stopIndex" : 156,
- "fragment" : "select col1 collate utf8_lcase from values ('aaa'), ('bbb'), ('BBB'), ('zzz'), ('ZZZ') intersect select col1 collate unicode_ci from values ('aaa'), ('bbb')"
- } ]
-}
-
-
--- !query
-create table t1 (c1 struct<utf8_binary: string, utf8_lcase: string collate utf8_lcase>) USING PARQUET
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
-
-
--- !query
-insert into t1 values (named_struct('utf8_binary', 'aaa', 'utf8_lcase', 'aaa'))
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [c1]
-+- Project [named_struct(utf8_binary, col1#x.utf8_binary, utf8_lcase, cast(col1#x.utf8_lcase as string collate UTF8_LCASE)) AS c1#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-insert into t1 values (named_struct('utf8_binary', 'AAA', 'utf8_lcase', 'AAA'))
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [c1]
-+- Project [named_struct(utf8_binary, col1#x.utf8_binary, utf8_lcase, cast(col1#x.utf8_lcase as string collate UTF8_LCASE)) AS c1#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-select count(*) from t1 group by c1.utf8_binary
--- !query analysis
-Aggregate [c1#x.utf8_binary], [count(1) AS count(1)#xL]
-+- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[c1#x] parquet
-
-
--- !query
-select count(*) from t1 group by c1.utf8_lcase
--- !query analysis
-Aggregate [c1#x.utf8_lcase], [count(1) AS count(1)#xL]
-+- SubqueryAlias spark_catalog.default.t1
- +- Relation spark_catalog.default.t1[c1#x] parquet
-
-
--- !query
-drop table t1
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
-
-
--- !query
-select array_contains(ARRAY('aaa' collate utf8_lcase),'AAA' collate utf8_lcase)
--- !query analysis
-Project [array_contains(array(collate(aaa, utf8_lcase)), collate(AAA, utf8_lcase)) AS array_contains(array(collate(aaa, utf8_lcase)), collate(AAA, utf8_lcase))#x]
-+- OneRowRelation
-
-
--- !query
-select array_position(ARRAY('aaa' collate utf8_lcase, 'bbb' collate utf8_lcase),'BBB' collate utf8_lcase)
--- !query analysis
-Project [array_position(array(collate(aaa, utf8_lcase), collate(bbb, utf8_lcase)), collate(BBB, utf8_lcase)) AS array_position(array(collate(aaa, utf8_lcase), collate(bbb, utf8_lcase)), collate(BBB, utf8_lcase))#xL]
-+- OneRowRelation
-
-
--- !query
-select nullif('aaa' COLLATE utf8_lcase, 'AAA' COLLATE utf8_lcase)
--- !query analysis
-Project [nullif(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase)) AS nullif(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase))#x]
-+- OneRowRelation
-
-
--- !query
-select least('aaa' COLLATE utf8_lcase, 'AAA' collate utf8_lcase, 'a' collate utf8_lcase)
--- !query analysis
-Project [least(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase), collate(a, utf8_lcase)) AS least(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase), collate(a, utf8_lcase))#x]
-+- OneRowRelation
-
-
--- !query
-select arrays_overlap(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
--- !query analysis
-Project [arrays_overlap(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS arrays_overlap(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
-+- OneRowRelation
-
-
--- !query
-select array_distinct(array('aaa' collate utf8_lcase, 'AAA' collate utf8_lcase))
--- !query analysis
-Project [array_distinct(array(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase))) AS array_distinct(array(collate(aaa, utf8_lcase), collate(AAA, utf8_lcase)))#x]
-+- OneRowRelation
-
-
--- !query
-select array_union(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
--- !query analysis
-Project [array_union(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS array_union(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
-+- OneRowRelation
-
-
--- !query
-select array_intersect(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
--- !query analysis
-Project [array_intersect(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS array_intersect(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
-+- OneRowRelation
-
-
--- !query
-select array_except(array('aaa' collate utf8_lcase), array('AAA' collate utf8_lcase))
--- !query analysis
-Project [array_except(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase))) AS array_except(array(collate(aaa, utf8_lcase)), array(collate(AAA, utf8_lcase)))#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate unicode < 'A'
--- !query analysis
-Project [(collate(a, unicode) < A) AS (collate(a, unicode) < 'A' collate UNICODE)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate unicode_ci = 'A'
--- !query analysis
-Project [(collate(a, unicode_ci) = A) AS (collate(a, unicode_ci) = 'A' collate UNICODE_CI)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate unicode_ai = 'å'
--- !query analysis
-Project [(collate(a, unicode_ai) = å) AS (collate(a, unicode_ai) = 'å' collate UNICODE_AI)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate unicode_ci_ai = 'Å'
--- !query analysis
-Project [(collate(a, unicode_ci_ai) = Å) AS (collate(a, unicode_ci_ai) = 'Å' collate UNICODE_CI_AI)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate en < 'A'
--- !query analysis
-Project [(collate(a, en) < A) AS (collate(a, en) < 'A' collate en)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate en_ci = 'A'
--- !query analysis
-Project [(collate(a, en_ci) = A) AS (collate(a, en_ci) = 'A' collate en_CI)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate en_ai = 'å'
--- !query analysis
-Project [(collate(a, en_ai) = å) AS (collate(a, en_ai) = 'å' collate en_AI)#x]
-+- OneRowRelation
-
-
--- !query
-select 'a' collate en_ci_ai = 'Å'
--- !query analysis
-Project [(collate(a, en_ci_ai) = Å) AS (collate(a, en_ci_ai) = 'Å' collate en_CI_AI)#x]
-+- OneRowRelation
-
-
--- !query
-select 'Kypper' collate sv < 'Köpfe'
--- !query analysis
-Project [(collate(Kypper, sv) < Köpfe) AS (collate(Kypper, sv) < 'Köpfe' collate sv)#x]
-+- OneRowRelation
-
-
--- !query
-select 'Kypper' collate de > 'Köpfe'
--- !query analysis
-Project [(collate(Kypper, de) > Köpfe) AS (collate(Kypper, de) > 'Köpfe' collate de)#x]
-+- OneRowRelation
-
-
--- !query
-select 'I' collate tr_ci = 'ı'
--- !query analysis
-Project [(collate(I, tr_ci) = ı) AS (collate(I, tr_ci) = 'ı' collate tr_CI)#x]
-+- OneRowRelation
-
-
--- !query
-create table t4 (text string collate utf8_binary, pairDelim string collate utf8_lcase, keyValueDelim string collate utf8_binary) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t4`, false
-
-
--- !query
-insert into t4 values('a:1,b:2,c:3', ',', ':')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t4, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t4], Append, `spark_catalog`.`default`.`t4`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t4), [text, pairDelim, keyValueDelim]
-+- Project [cast(col1#x as string) AS text#x, cast(col2#x as string collate UTF8_LCASE) AS pairDelim#x, cast(col3#x as string) AS keyValueDelim#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-select str_to_map(text, pairDelim, keyValueDelim) from t4
--- !query analysis
-Project [str_to_map(cast(text#x as string collate null), cast(pairDelim#x as string collate null), cast(keyValueDelim#x as string collate null)) AS str_to_map(text, pairDelim, keyValueDelim)#x]
-+- SubqueryAlias spark_catalog.default.t4
- +- Relation spark_catalog.default.t4[text#x,pairDelim#x,keyValueDelim#x] parquet
-
-
--- !query
-select str_to_map(text collate utf8_binary, pairDelim collate utf8_lcase, keyValueDelim collate utf8_binary) from t4
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select str_to_map(text collate utf8_binary, pairDelim collate utf8_binary, keyValueDelim collate utf8_binary) from t4
--- !query analysis
-Project [str_to_map(collate(text#x, utf8_binary), collate(pairDelim#x, utf8_binary), collate(keyValueDelim#x, utf8_binary)) AS str_to_map(collate(text, utf8_binary), collate(pairDelim, utf8_binary), collate(keyValueDelim, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t4
- +- Relation spark_catalog.default.t4[text#x,pairDelim#x,keyValueDelim#x] parquet
-
-
--- !query
-select str_to_map(text collate unicode_ai, pairDelim collate unicode_ai, keyValueDelim collate unicode_ai) from t4
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(text, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"str_to_map(collate(text, unicode_ai), collate(pairDelim, unicode_ai), collate(keyValueDelim, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 106,
- "fragment" : "str_to_map(text collate unicode_ai, pairDelim collate unicode_ai, keyValueDelim collate unicode_ai)"
- } ]
-}
-
-
--- !query
-drop table t4
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t4
-
-
--- !query
-create table t5(s string, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t5`, false
-
-
--- !query
-insert into t5 values ('Spark', 'Spark', 'SQL')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaAAaA')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaA')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('aaAaAAaA', 'aaAaAAaA', 'aaAaaAaAaaAaaAaAaaAaaAaA')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('bbAbaAbA', 'bbAbAAbA', 'a')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('İo', 'İo', 'İo')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('İo', 'İo', 'İo ')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('İo', 'İo ', 'İo')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('İo', 'İo', 'i̇o')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('efd2', 'efd2', 'efd2')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('Hello, world! Nice day.', 'Hello, world! Nice day.', 'Hello, world! Nice day.')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('Something else. Nothing here.', 'Something else. Nothing here.', 'Something else. Nothing here.')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('kitten', 'kitten', 'sitTing')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('abc', 'abc', 'abc')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-insert into t5 values ('abcdcba', 'abcdcba', 'aBcDCbA')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t5], Append, `spark_catalog`.`default`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t5), [s, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS s#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-create table t6(ascii long) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t6`, false
-
-
--- !query
-insert into t6 values (97)
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t6, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t6], Append, `spark_catalog`.`default`.`t6`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t6), [ascii]
-+- Project [cast(col1#x as bigint) AS ascii#xL]
- +- LocalRelation [col1#x]
-
-
--- !query
-insert into t6 values (66)
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t6, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t6], Append, `spark_catalog`.`default`.`t6`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t6), [ascii]
-+- Project [cast(col1#x as bigint) AS ascii#xL]
- +- LocalRelation [col1#x]
-
-
--- !query
-create table t7(ascii double) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t7`, false
-
-
--- !query
-insert into t7 values (97.52143)
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t7, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t7], Append, `spark_catalog`.`default`.`t7`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t7), [ascii]
-+- Project [cast(col1#x as double) AS ascii#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-insert into t7 values (66.421)
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t7, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t7], Append, `spark_catalog`.`default`.`t7`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t7), [ascii]
-+- Project [cast(col1#x as double) AS ascii#x]
- +- LocalRelation [col1#x]
-
-
--- !query
-create table t8(format string collate utf8_binary, utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t8`, false
-
-
--- !query
-insert into t8 values ('%s%s', 'abCdE', 'abCdE')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t8, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t8], Append, `spark_catalog`.`default`.`t8`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t8), [format, utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS format#x, cast(col2#x as string) AS utf8_binary#x, cast(col3#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x, col3#x]
-
-
--- !query
-create table t9(num long) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t9`, false
-
-
--- !query
-insert into t9 values (97)
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t9, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t9], Append, `spark_catalog`.`default`.`t9`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t9), [num]
-+- Project [cast(col1#x as bigint) AS num#xL]
- +- LocalRelation [col1#x]
-
-
--- !query
-insert into t9 values (66)
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t9, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t9], Append, `spark_catalog`.`default`.`t9`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t9), [num]
-+- Project [cast(col1#x as bigint) AS num#xL]
- +- LocalRelation [col1#x]
-
-
--- !query
-create table t10(utf8_binary string collate utf8_binary, utf8_lcase string collate utf8_lcase) using parquet
--- !query analysis
-CreateDataSourceTableCommand `spark_catalog`.`default`.`t10`, false
-
-
--- !query
-insert into t10 values ('aaAaAAaA', 'aaAaaAaA')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t10], Append, `spark_catalog`.`default`.`t10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t10), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-insert into t10 values ('efd2', 'efd2')
--- !query analysis
-InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t10], Append, `spark_catalog`.`default`.`t10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t10), [utf8_binary, utf8_lcase]
-+- Project [cast(col1#x as string) AS utf8_binary#x, cast(col2#x as string collate UTF8_LCASE) AS utf8_lcase#x]
- +- LocalRelation [col1#x, col2#x]
-
-
--- !query
-select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
--- !query analysis
-Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select concat_ws(' ', utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [concat_ws( , cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null)) AS concat_ws(' ' collate null, utf8_binary, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select concat_ws(' ' collate utf8_binary, utf8_binary, 'SQL' collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select concat_ws(' ' collate utf8_lcase, utf8_binary, 'SQL' collate utf8_lcase) from t5
--- !query analysis
-Project [concat_ws(collate( , utf8_lcase), cast(utf8_binary#x as string collate UTF8_LCASE), collate(SQL, utf8_lcase)) AS concat_ws(collate( , utf8_lcase), utf8_binary, collate(SQL, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select concat_ws(',', utf8_lcase, 'word'), concat_ws(',', utf8_binary, 'word') from t5
--- !query analysis
-Project [concat_ws(,, utf8_lcase#x, word) AS concat_ws(',' collate UTF8_LCASE, utf8_lcase, 'word' collate UTF8_LCASE)#x, concat_ws(,, utf8_binary#x, word) AS concat_ws(,, utf8_binary, word)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select concat_ws(',', utf8_lcase, 'word' collate utf8_binary), concat_ws(',', utf8_binary, 'word' collate utf8_lcase) from t5
--- !query analysis
-Project [concat_ws(,, cast(utf8_lcase#x as string), collate(word, utf8_binary)) AS concat_ws(,, utf8_lcase, collate(word, utf8_binary))#x, concat_ws(,, cast(utf8_binary#x as string collate UTF8_LCASE), collate(word, utf8_lcase)) AS concat_ws(',' collate UTF8_LCASE, utf8_binary, collate(word, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select elt(2, s, utf8_binary) from t5
--- !query analysis
-Project [elt(2, s#x, utf8_binary#x, true) AS elt(2, s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select elt(2, utf8_binary, utf8_lcase, s) from t5
--- !query analysis
-Project [elt(2, cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), cast(s#x as string collate null), true) AS elt(2, utf8_binary, utf8_lcase, s)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select elt(1, utf8_binary collate utf8_binary, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select elt(1, utf8_binary collate utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [elt(1, collate(utf8_binary#x, utf8_binary), collate(utf8_lcase#x, utf8_binary), true) AS elt(1, collate(utf8_binary, utf8_binary), collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select elt(1, utf8_binary collate utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [elt(1, collate(utf8_binary#x, utf8_binary), cast(utf8_lcase#x as string), true) AS elt(1, collate(utf8_binary, utf8_binary), utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select elt(1, utf8_binary, 'word'), elt(1, utf8_lcase, 'word') from t5
--- !query analysis
-Project [elt(1, utf8_binary#x, word, true) AS elt(1, utf8_binary, word)#x, elt(1, utf8_lcase#x, word, true) AS elt(1, utf8_lcase, 'word' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select elt(1, utf8_binary, 'word' collate utf8_lcase), elt(1, utf8_lcase, 'word' collate utf8_binary) from t5
--- !query analysis
-Project [elt(1, cast(utf8_binary#x as string collate UTF8_LCASE), collate(word, utf8_lcase), true) AS elt(1, utf8_binary, collate(word, utf8_lcase))#x, elt(1, cast(utf8_lcase#x as string), collate(word, utf8_binary), true) AS elt(1, utf8_lcase, collate(word, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(utf8_binary, utf8_lcase, 3) from t5
--- !query analysis
-Project [split_part(cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), 3) AS split_part(utf8_binary, utf8_lcase, 3)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(s, utf8_binary, 1) from t5
--- !query analysis
-Project [split_part(s#x, utf8_binary#x, 1) AS split_part(s, utf8_binary, 1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(utf8_binary collate utf8_binary, s collate utf8_lcase, 1) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select split_part(utf8_binary, utf8_lcase collate utf8_binary, 2) from t5
--- !query analysis
-Project [split_part(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 2) AS split_part(utf8_binary, collate(utf8_lcase, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 2) from t5
--- !query analysis
-Project [split_part(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 2) AS split_part(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"split_part(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 2)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 83,
- "fragment" : "split_part(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2)"
- } ]
-}
-
-
--- !query
-select split_part(utf8_binary, 'a', 3), split_part(utf8_lcase, 'a', 3) from t5
--- !query analysis
-Project [split_part(utf8_binary#x, a, 3) AS split_part(utf8_binary, a, 3)#x, split_part(utf8_lcase#x, a, 3) AS split_part(utf8_lcase, 'a' collate UTF8_LCASE, 3)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(utf8_binary, 'a' collate utf8_lcase, 3), split_part(utf8_lcase, 'a' collate utf8_binary, 3) from t5
--- !query analysis
-Project [split_part(cast(utf8_binary#x as string collate UTF8_LCASE), collate(a, utf8_lcase), 3) AS split_part(utf8_binary, collate(a, utf8_lcase), 3)#x, split_part(cast(utf8_lcase#x as string), collate(a, utf8_binary), 3) AS split_part(utf8_lcase, collate(a, utf8_binary), 3)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select split_part(utf8_binary, 'a ' collate utf8_lcase_rtrim, 3), split_part(utf8_lcase, 'a' collate utf8_binary, 3) from t5
--- !query analysis
-Project [split_part(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(a , utf8_lcase_rtrim), 3) AS split_part(utf8_binary, collate(a , utf8_lcase_rtrim), 3)#x, split_part(cast(utf8_lcase#x as string), collate(a, utf8_binary), 3) AS split_part(utf8_lcase, collate(a, utf8_binary), 3)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select contains(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"contains(utf8_binary, utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 40,
- "fragment" : "contains(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select contains(s, utf8_binary) from t5
--- !query analysis
-Project [Contains(s#x, utf8_binary#x) AS contains(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select contains(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select contains(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [Contains(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS contains(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select contains(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [Contains(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS contains(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select contains(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"contains(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 78,
- "fragment" : "contains(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select contains(utf8_binary, 'a'), contains(utf8_lcase, 'a') from t5
--- !query analysis
-Project [Contains(utf8_binary#x, a) AS contains(utf8_binary, a)#x, Contains(utf8_lcase#x, a) AS contains(utf8_lcase, 'a' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select contains(utf8_binary, 'AaAA' collate utf8_lcase), contains(utf8_lcase, 'AAa' collate utf8_binary) from t5
--- !query analysis
-Project [Contains(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase)) AS contains(utf8_binary, collate(AaAA, utf8_lcase))#x, Contains(cast(utf8_lcase#x as string), collate(AAa, utf8_binary)) AS contains(utf8_lcase, collate(AAa, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select contains(utf8_binary, 'AaAA ' collate utf8_lcase_rtrim), contains(utf8_lcase, 'AAa ' collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [Contains(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(AaAA , utf8_lcase_rtrim)) AS contains(utf8_binary, collate(AaAA , utf8_lcase_rtrim))#x, Contains(cast(utf8_lcase#x as string collate UTF8_BINARY_RTRIM), collate(AAa , utf8_binary_rtrim)) AS contains(utf8_lcase, collate(AAa , utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substring_index(utf8_binary, utf8_lcase, 2) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"substring_index(utf8_binary, utf8_lcase, 2)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 50,
- "fragment" : "substring_index(utf8_binary, utf8_lcase, 2)"
- } ]
-}
-
-
--- !query
-select substring_index(s, utf8_binary,1) from t5
--- !query analysis
-Project [substring_index(s#x, utf8_binary#x, 1) AS substring_index(s, utf8_binary, 1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substring_index(utf8_binary collate utf8_binary, s collate utf8_lcase, 3) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select substring_index(utf8_binary, utf8_lcase collate utf8_binary, 2) from t5
--- !query analysis
-Project [substring_index(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 2) AS substring_index(utf8_binary, collate(utf8_lcase, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substring_index(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 2) from t5
--- !query analysis
-Project [substring_index(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 2) AS substring_index(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substring_index(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"substring_index(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 2)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 88,
- "fragment" : "substring_index(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 2)"
- } ]
-}
-
-
--- !query
-select substring_index(utf8_binary, 'a', 2), substring_index(utf8_lcase, 'a', 2) from t5
--- !query analysis
-Project [substring_index(utf8_binary#x, a, 2) AS substring_index(utf8_binary, a, 2)#x, substring_index(utf8_lcase#x, a, 2) AS substring_index(utf8_lcase, 'a' collate UTF8_LCASE, 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substring_index(utf8_binary, 'AaAA' collate utf8_lcase, 2), substring_index(utf8_lcase, 'AAa' collate utf8_binary, 2) from t5
--- !query analysis
-Project [substring_index(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), 2) AS substring_index(utf8_binary, collate(AaAA, utf8_lcase), 2)#x, substring_index(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 2) AS substring_index(utf8_lcase, collate(AAa, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substring_index(utf8_binary, 'AaAA ' collate utf8_lcase_rtrim, 2), substring_index(utf8_lcase, 'AAa' collate utf8_binary, 2) from t5
--- !query analysis
-Project [substring_index(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(AaAA , utf8_lcase_rtrim), 2) AS substring_index(utf8_binary, collate(AaAA , utf8_lcase_rtrim), 2)#x, substring_index(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 2) AS substring_index(utf8_lcase, collate(AAa, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select instr(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"instr(utf8_binary, utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 37,
- "fragment" : "instr(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select instr(s, utf8_binary) from t5
--- !query analysis
-Project [instr(s#x, utf8_binary#x) AS instr(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select instr(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select instr(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [instr(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS instr(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select instr(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [instr(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS instr(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select instr(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"instr(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 75,
- "fragment" : "instr(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select instr(utf8_binary, 'a'), instr(utf8_lcase, 'a') from t5
--- !query analysis
-Project [instr(utf8_binary#x, a) AS instr(utf8_binary, a)#x, instr(utf8_lcase#x, a) AS instr(utf8_lcase, 'a' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select instr(utf8_binary, 'AaAA' collate utf8_lcase), instr(utf8_lcase, 'AAa' collate utf8_binary) from t5
--- !query analysis
-Project [instr(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase)) AS instr(utf8_binary, collate(AaAA, utf8_lcase))#x, instr(cast(utf8_lcase#x as string), collate(AAa, utf8_binary)) AS instr(utf8_lcase, collate(AAa, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select find_in_set(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"find_in_set(utf8_binary, utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 43,
- "fragment" : "find_in_set(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select find_in_set(s, utf8_binary) from t5
--- !query analysis
-Project [find_in_set(s#x, utf8_binary#x) AS find_in_set(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select find_in_set(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select find_in_set(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [find_in_set(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS find_in_set(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select find_in_set(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [find_in_set(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS find_in_set(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select find_in_set(utf8_binary, 'aaAaaAaA,i̇o'), find_in_set(utf8_lcase, 'aaAaaAaA,i̇o') from t5
--- !query analysis
-Project [find_in_set(utf8_binary#x, aaAaaAaA,i̇o) AS find_in_set(utf8_binary, aaAaaAaA,i̇o)#x, find_in_set(utf8_lcase#x, aaAaaAaA,i̇o) AS find_in_set(utf8_lcase, 'aaAaaAaA,i̇o' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select find_in_set(utf8_binary, 'aaAaaAaA,i̇o' collate utf8_lcase), find_in_set(utf8_lcase, 'aaAaaAaA,i̇o' collate utf8_binary) from t5
--- !query analysis
-Project [find_in_set(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA,i̇o, utf8_lcase)) AS find_in_set(utf8_binary, collate(aaAaaAaA,i̇o, utf8_lcase))#x, find_in_set(cast(utf8_lcase#x as string), collate(aaAaaAaA,i̇o, utf8_binary)) AS find_in_set(utf8_lcase, collate(aaAaaAaA,i̇o, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select find_in_set(utf8_binary, 'aaAaaAaA,i̇o ' collate utf8_lcase_rtrim), find_in_set(utf8_lcase, 'aaAaaAaA,i̇o' collate utf8_binary) from t5
--- !query analysis
-Project [find_in_set(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA,i̇o , utf8_lcase_rtrim)) AS find_in_set(utf8_binary, collate(aaAaaAaA,i̇o , utf8_lcase_rtrim))#x, find_in_set(cast(utf8_lcase#x as string), collate(aaAaaAaA,i̇o, utf8_binary)) AS find_in_set(utf8_lcase, collate(aaAaaAaA,i̇o, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select startswith(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"startswith(utf8_binary, utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 42,
- "fragment" : "startswith(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select startswith(s, utf8_binary) from t5
--- !query analysis
-Project [StartsWith(s#x, utf8_binary#x) AS startswith(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select startswith(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select startswith(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [StartsWith(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS startswith(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select startswith(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [StartsWith(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS startswith(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select startswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"startswith(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 80,
- "fragment" : "startswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select startswith(utf8_binary, 'aaAaaAaA'), startswith(utf8_lcase, 'aaAaaAaA') from t5
--- !query analysis
-Project [StartsWith(utf8_binary#x, aaAaaAaA) AS startswith(utf8_binary, aaAaaAaA)#x, StartsWith(utf8_lcase#x, aaAaaAaA) AS startswith(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select startswith(utf8_binary, 'aaAaaAaA' collate utf8_lcase), startswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t5
--- !query analysis
-Project [StartsWith(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA, utf8_lcase)) AS startswith(utf8_binary, collate(aaAaaAaA, utf8_lcase))#x, StartsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS startswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select startswith(utf8_binary, 'aaAaaAaA ' collate utf8_lcase_rtrim), startswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t5
--- !query analysis
-Project [StartsWith(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA , utf8_lcase_rtrim)) AS startswith(utf8_binary, collate(aaAaaAaA , utf8_lcase_rtrim))#x, StartsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS startswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select translate(utf8_lcase, utf8_lcase, '12345') from t5
--- !query analysis
-Project [translate(utf8_lcase#x, utf8_lcase#x, 12345) AS translate(utf8_lcase, utf8_lcase, '12345' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select translate(utf8_binary, utf8_lcase, '12345') from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"translate(utf8_binary, utf8_lcase, 12345)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 50,
- "fragment" : "translate(utf8_binary, utf8_lcase, '12345')"
- } ]
-}
-
-
--- !query
-select translate(utf8_binary, 'aBc' collate utf8_lcase, '12345' collate utf8_binary) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
- }
-}
-
-
--- !query
-select translate(utf8_binary, 'SQL' collate utf8_lcase, '12345' collate utf8_lcase) from t5
--- !query analysis
-Project [translate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(SQL, utf8_lcase), collate(12345, utf8_lcase)) AS translate(utf8_binary, collate(SQL, utf8_lcase), collate(12345, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select translate(utf8_binary, 'SQL' collate unicode_ai, '12345' collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"utf8_binary\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"translate(utf8_binary, collate(SQL, unicode_ai), collate(12345, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 83,
- "fragment" : "translate(utf8_binary, 'SQL' collate unicode_ai, '12345' collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select translate(utf8_lcase, 'aaAaaAaA', '12345'), translate(utf8_binary, 'aaAaaAaA', '12345') from t5
--- !query analysis
-Project [translate(utf8_lcase#x, aaAaaAaA, 12345) AS translate(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE, '12345' collate UTF8_LCASE)#x, translate(utf8_binary#x, aaAaaAaA, 12345) AS translate(utf8_binary, aaAaaAaA, 12345)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select translate(utf8_lcase, 'aBc' collate utf8_binary, '12345'), translate(utf8_binary, 'aBc' collate utf8_lcase, '12345') from t5
--- !query analysis
-Project [translate(cast(utf8_lcase#x as string), collate(aBc, utf8_binary), 12345) AS translate(utf8_lcase, collate(aBc, utf8_binary), 12345)#x, translate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aBc, utf8_lcase), 12345) AS translate(utf8_binary, collate(aBc, utf8_lcase), '12345' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select translate(utf8_lcase, 'aBc ' collate utf8_binary_rtrim, '12345'), translate(utf8_binary, 'aBc' collate utf8_lcase, '12345') from t5
--- !query analysis
-Project [translate(cast(utf8_lcase#x as string collate UTF8_BINARY_RTRIM), collate(aBc , utf8_binary_rtrim), 12345) AS translate(utf8_lcase, collate(aBc , utf8_binary_rtrim), '12345' collate UTF8_BINARY_RTRIM)#x, translate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aBc, utf8_lcase), 12345) AS translate(utf8_binary, collate(aBc, utf8_lcase), '12345' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select replace(utf8_binary, utf8_lcase, 'abc') from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"replace(utf8_binary, utf8_lcase, abc)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 46,
- "fragment" : "replace(utf8_binary, utf8_lcase, 'abc')"
- } ]
-}
-
-
--- !query
-select replace(s, utf8_binary, 'abc') from t5
--- !query analysis
-Project [replace(s#x, utf8_binary#x, abc) AS replace(s, utf8_binary, abc)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select replace(utf8_binary collate utf8_binary, s collate utf8_lcase, 'abc') from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select replace(utf8_binary, utf8_lcase collate utf8_binary, 'abc') from t5
--- !query analysis
-Project [replace(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), abc) AS replace(utf8_binary, collate(utf8_lcase, utf8_binary), abc)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select replace(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 'abc') from t5
--- !query analysis
-Project [replace(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), abc) AS replace(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 'abc' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select replace(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 'abc') from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"replace(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 'abc' collate UNICODE_AI)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 84,
- "fragment" : "replace(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 'abc')"
- } ]
-}
-
-
--- !query
-select replace(utf8_binary, 'aaAaaAaA', 'abc'), replace(utf8_lcase, 'aaAaaAaA', 'abc') from t5
--- !query analysis
-Project [replace(utf8_binary#x, aaAaaAaA, abc) AS replace(utf8_binary, aaAaaAaA, abc)#x, replace(utf8_lcase#x, aaAaaAaA, abc) AS replace(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE, 'abc' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select replace(utf8_binary, 'aaAaaAaA' collate utf8_lcase, 'abc'), replace(utf8_lcase, 'aaAaaAaA' collate utf8_binary, 'abc') from t5
--- !query analysis
-Project [replace(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA, utf8_lcase), abc) AS replace(utf8_binary, collate(aaAaaAaA, utf8_lcase), 'abc' collate UTF8_LCASE)#x, replace(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary), abc) AS replace(utf8_lcase, collate(aaAaaAaA, utf8_binary), abc)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select replace(utf8_binary, 'aaAaaAaA ' collate utf8_lcase_rtrim, 'abc'), replace(utf8_lcase, 'aaAaaAaA' collate utf8_binary, 'abc') from t5
--- !query analysis
-Project [replace(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA , utf8_lcase_rtrim), abc) AS replace(utf8_binary, collate(aaAaaAaA , utf8_lcase_rtrim), 'abc' collate UTF8_LCASE_RTRIM)#x, replace(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary), abc) AS replace(utf8_lcase, collate(aaAaaAaA, utf8_binary), abc)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select endswith(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"endswith(utf8_binary, utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 40,
- "fragment" : "endswith(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select endswith(s, utf8_binary) from t5
--- !query analysis
-Project [EndsWith(s#x, utf8_binary#x) AS endswith(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select endswith(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select endswith(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [EndsWith(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS endswith(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select endswith(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [EndsWith(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS endswith(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select endswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"endswith(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 78,
- "fragment" : "endswith(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select endswith(utf8_binary, 'aaAaaAaA'), endswith(utf8_lcase, 'aaAaaAaA') from t5
--- !query analysis
-Project [EndsWith(utf8_binary#x, aaAaaAaA) AS endswith(utf8_binary, aaAaaAaA)#x, EndsWith(utf8_lcase#x, aaAaaAaA) AS endswith(utf8_lcase, 'aaAaaAaA' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select endswith(utf8_binary, 'aaAaaAaA' collate utf8_lcase), endswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t5
--- !query analysis
-Project [EndsWith(cast(utf8_binary#x as string collate UTF8_LCASE), collate(aaAaaAaA, utf8_lcase)) AS endswith(utf8_binary, collate(aaAaaAaA, utf8_lcase))#x, EndsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS endswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select endswith(utf8_binary, 'aaAaaAaA ' collate utf8_lcase_rtrim), endswith(utf8_lcase, 'aaAaaAaA' collate utf8_binary) from t5
--- !query analysis
-Project [EndsWith(cast(utf8_binary#x as string collate UTF8_LCASE_RTRIM), collate(aaAaaAaA , utf8_lcase_rtrim)) AS endswith(utf8_binary, collate(aaAaaAaA , utf8_lcase_rtrim))#x, EndsWith(cast(utf8_lcase#x as string), collate(aaAaaAaA, utf8_binary)) AS endswith(utf8_lcase, collate(aaAaaAaA, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select repeat(utf8_binary, 3), repeat(utf8_lcase, 2) from t5
--- !query analysis
-Project [repeat(utf8_binary#x, 3) AS repeat(utf8_binary, 3)#x, repeat(utf8_lcase#x, 2) AS repeat(utf8_lcase, 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select repeat(utf8_binary collate utf8_lcase, 3), repeat(utf8_lcase collate utf8_binary, 2) from t5
--- !query analysis
-Project [repeat(collate(utf8_binary#x, utf8_lcase), 3) AS repeat(collate(utf8_binary, utf8_lcase), 3)#x, repeat(collate(utf8_lcase#x, utf8_binary), 2) AS repeat(collate(utf8_lcase, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select ascii(utf8_binary), ascii(utf8_lcase) from t5
--- !query analysis
-Project [ascii(utf8_binary#x) AS ascii(utf8_binary)#x, ascii(utf8_lcase#x) AS ascii(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select ascii(utf8_binary collate utf8_lcase), ascii(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [ascii(collate(utf8_binary#x, utf8_lcase)) AS ascii(collate(utf8_binary, utf8_lcase))#x, ascii(collate(utf8_lcase#x, utf8_binary)) AS ascii(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select unbase64(utf8_binary), unbase64(utf8_lcase) from t10
--- !query analysis
-Project [unbase64(utf8_binary#x, false) AS unbase64(utf8_binary)#x, unbase64(utf8_lcase#x, false) AS unbase64(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t10
- +- Relation spark_catalog.default.t10[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select unbase64(utf8_binary collate utf8_lcase), unbase64(utf8_lcase collate utf8_binary) from t10
--- !query analysis
-Project [unbase64(collate(utf8_binary#x, utf8_lcase), false) AS unbase64(collate(utf8_binary, utf8_lcase))#x, unbase64(collate(utf8_lcase#x, utf8_binary), false) AS unbase64(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t10
- +- Relation spark_catalog.default.t10[utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select chr(ascii) from t6
--- !query analysis
-Project [chr(ascii#xL) AS chr(ascii)#x]
-+- SubqueryAlias spark_catalog.default.t6
- +- Relation spark_catalog.default.t6[ascii#xL] parquet
-
-
--- !query
-select base64(utf8_binary), base64(utf8_lcase) from t5
--- !query analysis
-Project [base64(cast(utf8_binary#x as binary)) AS base64(utf8_binary)#x, base64(cast(utf8_lcase#x as binary)) AS base64(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select base64(utf8_binary collate utf8_lcase), base64(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [base64(cast(collate(utf8_binary#x, utf8_lcase) as binary)) AS base64(collate(utf8_binary, utf8_lcase))#x, base64(cast(collate(utf8_lcase#x, utf8_binary) as binary)) AS base64(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select decode(encode(utf8_binary, 'utf-8'), 'utf-8'), decode(encode(utf8_lcase, 'utf-8'), 'utf-8') from t5
--- !query analysis
-Project [decode(encode(utf8_binary#x, utf-8), utf-8) AS decode(encode(utf8_binary, utf-8), utf-8)#x, decode(encode(utf8_lcase#x, utf-8), utf-8) AS decode(encode(utf8_lcase, utf-8), utf-8)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select decode(encode(utf8_binary collate utf8_lcase, 'utf-8'), 'utf-8'), decode(encode(utf8_lcase collate utf8_binary, 'utf-8'), 'utf-8') from t5
--- !query analysis
-Project [decode(encode(collate(utf8_binary#x, utf8_lcase), utf-8), utf-8) AS decode(encode(collate(utf8_binary, utf8_lcase), utf-8), utf-8)#x, decode(encode(collate(utf8_lcase#x, utf8_binary), utf-8), utf-8) AS decode(encode(collate(utf8_lcase, utf8_binary), utf-8), utf-8)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select format_number(ascii, '###.###') from t7
--- !query analysis
-Project [format_number(ascii#x, ###.###) AS format_number(ascii, ###.###)#x]
-+- SubqueryAlias spark_catalog.default.t7
- +- Relation spark_catalog.default.t7[ascii#x] parquet
-
-
--- !query
-select format_number(ascii, '###.###' collate utf8_lcase) from t7
--- !query analysis
-Project [format_number(ascii#x, collate(###.###, utf8_lcase)) AS format_number(ascii, collate(###.###, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t7
- +- Relation spark_catalog.default.t7[ascii#x] parquet
-
-
--- !query
-select encode(utf8_binary, 'utf-8'), encode(utf8_lcase, 'utf-8') from t5
--- !query analysis
-Project [encode(utf8_binary#x, utf-8) AS encode(utf8_binary, utf-8)#x, encode(utf8_lcase#x, utf-8) AS encode(utf8_lcase, utf-8)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select encode(utf8_binary collate utf8_lcase, 'utf-8'), encode(utf8_lcase collate utf8_binary, 'utf-8') from t5
--- !query analysis
-Project [encode(collate(utf8_binary#x, utf8_lcase), utf-8) AS encode(collate(utf8_binary, utf8_lcase), utf-8)#x, encode(collate(utf8_lcase#x, utf8_binary), utf-8) AS encode(collate(utf8_lcase, utf8_binary), utf-8)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select to_binary(utf8_binary, 'utf-8'), to_binary(utf8_lcase, 'utf-8') from t5
--- !query analysis
-Project [to_binary(utf8_binary#x, Some(utf-8), false) AS to_binary(utf8_binary, utf-8)#x, to_binary(utf8_lcase#x, Some(utf-8), false) AS to_binary(utf8_lcase, utf-8)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select to_binary(utf8_binary collate utf8_lcase, 'utf-8'), to_binary(utf8_lcase collate utf8_binary, 'utf-8') from t5
--- !query analysis
-Project [to_binary(collate(utf8_binary#x, utf8_lcase), Some(utf-8), false) AS to_binary(collate(utf8_binary, utf8_lcase), utf-8)#x, to_binary(collate(utf8_lcase#x, utf8_binary), Some(utf-8), false) AS to_binary(collate(utf8_lcase, utf8_binary), utf-8)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select sentences(utf8_binary), sentences(utf8_lcase) from t5
--- !query analysis
-Project [sentences(utf8_binary#x, , ) AS sentences(utf8_binary, , )#x, sentences(utf8_lcase#x, , ) AS sentences(utf8_lcase, , )#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select sentences(utf8_binary collate utf8_lcase), sentences(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [sentences(collate(utf8_binary#x, utf8_lcase), , ) AS sentences(collate(utf8_binary, utf8_lcase), , )#x, sentences(collate(utf8_lcase#x, utf8_binary), , ) AS sentences(collate(utf8_lcase, utf8_binary), , )#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select upper(utf8_binary), upper(utf8_lcase) from t5
--- !query analysis
-Project [upper(utf8_binary#x) AS upper(utf8_binary)#x, upper(utf8_lcase#x) AS upper(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select upper(utf8_binary collate utf8_lcase), upper(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [upper(collate(utf8_binary#x, utf8_lcase)) AS upper(collate(utf8_binary, utf8_lcase))#x, upper(collate(utf8_lcase#x, utf8_binary)) AS upper(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lower(utf8_binary), lower(utf8_lcase) from t5
--- !query analysis
-Project [lower(utf8_binary#x) AS lower(utf8_binary)#x, lower(utf8_lcase#x) AS lower(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lower(utf8_binary collate utf8_lcase), lower(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [lower(collate(utf8_binary#x, utf8_lcase)) AS lower(collate(utf8_binary, utf8_lcase))#x, lower(collate(utf8_lcase#x, utf8_binary)) AS lower(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select initcap(utf8_binary), initcap(utf8_lcase) from t5
--- !query analysis
-Project [initcap(utf8_binary#x) AS initcap(utf8_binary)#x, initcap(utf8_lcase#x) AS initcap(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select initcap(utf8_binary collate utf8_lcase), initcap(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [initcap(collate(utf8_binary#x, utf8_lcase)) AS initcap(collate(utf8_binary, utf8_lcase))#x, initcap(collate(utf8_lcase#x, utf8_binary)) AS initcap(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select overlay(utf8_binary, utf8_lcase, 2) from t5
--- !query analysis
-Project [overlay(cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), 2, -1) AS overlay(utf8_binary, utf8_lcase, 2, -1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select overlay(s, utf8_binary,1) from t5
--- !query analysis
-Project [overlay(s#x, utf8_binary#x, 1, -1) AS overlay(s, utf8_binary, 1, -1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select overlay(utf8_binary collate utf8_binary, s collate utf8_lcase, 3) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select overlay(utf8_binary, utf8_lcase collate utf8_binary, 2) from t5
--- !query analysis
-Project [overlay(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 2, -1) AS overlay(utf8_binary, collate(utf8_lcase, utf8_binary), 2, -1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select overlay(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 2) from t5
--- !query analysis
-Project [overlay(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 2, -1) AS overlay(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 2, -1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select overlay(utf8_binary, 'a', 2), overlay(utf8_lcase, 'a', 2) from t5
--- !query analysis
-Project [overlay(utf8_binary#x, a, 2, -1) AS overlay(utf8_binary, a, 2, -1)#x, overlay(utf8_lcase#x, a, 2, -1) AS overlay(utf8_lcase, 'a' collate UTF8_LCASE, 2, -1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select overlay(utf8_binary, 'AaAA' collate utf8_lcase, 2), overlay(utf8_lcase, 'AAa' collate utf8_binary, 2) from t5
--- !query analysis
-Project [overlay(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), 2, -1) AS overlay(utf8_binary, collate(AaAA, utf8_lcase), 2, -1)#x, overlay(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 2, -1) AS overlay(utf8_lcase, collate(AAa, utf8_binary), 2, -1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select format_string(format, utf8_binary, utf8_lcase) from t8
--- !query analysis
-Project [format_string(format#x, utf8_binary#x, utf8_lcase#x) AS format_string(format, utf8_binary, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t8
- +- Relation spark_catalog.default.t8[format#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select format_string(format collate utf8_lcase, utf8_lcase, utf8_binary collate utf8_lcase, 3), format_string(format, utf8_lcase collate utf8_binary, utf8_binary) from t8
--- !query analysis
-Project [format_string(collate(format#x, utf8_lcase), utf8_lcase#x, collate(utf8_binary#x, utf8_lcase), 3) AS format_string(collate(format, utf8_lcase), utf8_lcase, collate(utf8_binary, utf8_lcase), 3)#x, format_string(format#x, collate(utf8_lcase#x, utf8_binary), utf8_binary#x) AS format_string(format, collate(utf8_lcase, utf8_binary), utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t8
- +- Relation spark_catalog.default.t8[format#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select format_string(format, utf8_binary, utf8_lcase) from t8
--- !query analysis
-Project [format_string(format#x, utf8_binary#x, utf8_lcase#x) AS format_string(format, utf8_binary, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t8
- +- Relation spark_catalog.default.t8[format#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select soundex(utf8_binary), soundex(utf8_lcase) from t5
--- !query analysis
-Project [soundex(utf8_binary#x) AS soundex(utf8_binary)#x, soundex(utf8_lcase#x) AS soundex(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select soundex(utf8_binary collate utf8_lcase), soundex(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [soundex(collate(utf8_binary#x, utf8_lcase)) AS soundex(collate(utf8_binary, utf8_lcase))#x, soundex(collate(utf8_lcase#x, utf8_binary)) AS soundex(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select length(utf8_binary), length(utf8_lcase) from t5
--- !query analysis
-Project [length(utf8_binary#x) AS length(utf8_binary)#x, length(utf8_lcase#x) AS length(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select length(utf8_binary collate utf8_lcase), length(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [length(collate(utf8_binary#x, utf8_lcase)) AS length(collate(utf8_binary, utf8_lcase))#x, length(collate(utf8_lcase#x, utf8_binary)) AS length(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select bit_length(utf8_binary), bit_length(utf8_lcase) from t5
--- !query analysis
-Project [bit_length(utf8_binary#x) AS bit_length(utf8_binary)#x, bit_length(utf8_lcase#x) AS bit_length(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select bit_length(utf8_binary collate utf8_lcase), bit_length(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [bit_length(collate(utf8_binary#x, utf8_lcase)) AS bit_length(collate(utf8_binary, utf8_lcase))#x, bit_length(collate(utf8_lcase#x, utf8_binary)) AS bit_length(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select octet_length(utf8_binary), octet_length(utf8_lcase) from t5
--- !query analysis
-Project [octet_length(utf8_binary#x) AS octet_length(utf8_binary)#x, octet_length(utf8_lcase#x) AS octet_length(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select octet_length(utf8_binary collate utf8_lcase), octet_length(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [octet_length(collate(utf8_binary#x, utf8_lcase)) AS octet_length(collate(utf8_binary, utf8_lcase))#x, octet_length(collate(utf8_lcase#x, utf8_binary)) AS octet_length(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select octet_length(utf8_binary collate utf8_lcase_rtrim), octet_length(utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [octet_length(collate(utf8_binary#x, utf8_lcase_rtrim)) AS octet_length(collate(utf8_binary, utf8_lcase_rtrim))#x, octet_length(collate(utf8_lcase#x, utf8_binary_rtrim)) AS octet_length(collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select luhn_check(num) from t9
--- !query analysis
-Project [luhn_check(cast(num#xL as string)) AS luhn_check(num)#x]
-+- SubqueryAlias spark_catalog.default.t9
- +- Relation spark_catalog.default.t9[num#xL] parquet
-
-
--- !query
-select levenshtein(utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [levenshtein(cast(utf8_binary#x as string collate null), cast(utf8_lcase#x as string collate null), None) AS levenshtein(utf8_binary, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select levenshtein(s, utf8_binary) from t5
--- !query analysis
-Project [levenshtein(s#x, utf8_binary#x, None) AS levenshtein(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select levenshtein(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select levenshtein(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [levenshtein(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), None) AS levenshtein(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select levenshtein(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [levenshtein(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), None) AS levenshtein(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select levenshtein(utf8_binary, 'a'), levenshtein(utf8_lcase, 'a') from t5
--- !query analysis
-Project [levenshtein(utf8_binary#x, a, None) AS levenshtein(utf8_binary, a)#x, levenshtein(utf8_lcase#x, a, None) AS levenshtein(utf8_lcase, 'a' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select levenshtein(utf8_binary, 'AaAA' collate utf8_lcase, 3), levenshtein(utf8_lcase, 'AAa' collate utf8_binary, 4) from t5
--- !query analysis
-Project [levenshtein(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), Some(3)) AS levenshtein(utf8_binary, collate(AaAA, utf8_lcase), 3)#x, levenshtein(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), Some(4)) AS levenshtein(utf8_lcase, collate(AAa, utf8_binary), 4)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select is_valid_utf8(utf8_binary), is_valid_utf8(utf8_lcase) from t5
--- !query analysis
-Project [is_valid_utf8(utf8_binary#x) AS is_valid_utf8(utf8_binary)#x, is_valid_utf8(utf8_lcase#x) AS is_valid_utf8(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select is_valid_utf8(utf8_binary collate utf8_lcase), is_valid_utf8(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [is_valid_utf8(collate(utf8_binary#x, utf8_lcase)) AS is_valid_utf8(collate(utf8_binary, utf8_lcase))#x, is_valid_utf8(collate(utf8_lcase#x, utf8_binary)) AS is_valid_utf8(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select is_valid_utf8(utf8_binary collate utf8_lcase_rtrim), is_valid_utf8(utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [is_valid_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS is_valid_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, is_valid_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS is_valid_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select make_valid_utf8(utf8_binary), make_valid_utf8(utf8_lcase) from t5
--- !query analysis
-Project [make_valid_utf8(utf8_binary#x) AS make_valid_utf8(utf8_binary)#x, make_valid_utf8(utf8_lcase#x) AS make_valid_utf8(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select make_valid_utf8(utf8_binary collate utf8_lcase), make_valid_utf8(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [make_valid_utf8(collate(utf8_binary#x, utf8_lcase)) AS make_valid_utf8(collate(utf8_binary, utf8_lcase))#x, make_valid_utf8(collate(utf8_lcase#x, utf8_binary)) AS make_valid_utf8(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select make_valid_utf8(utf8_binary collate utf8_lcase_rtrim), make_valid_utf8(utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [make_valid_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS make_valid_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, make_valid_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS make_valid_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select validate_utf8(utf8_binary), validate_utf8(utf8_lcase) from t5
--- !query analysis
-Project [validate_utf8(utf8_binary#x) AS validate_utf8(utf8_binary)#x, validate_utf8(utf8_lcase#x) AS validate_utf8(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select validate_utf8(utf8_binary collate utf8_lcase), validate_utf8(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [validate_utf8(collate(utf8_binary#x, utf8_lcase)) AS validate_utf8(collate(utf8_binary, utf8_lcase))#x, validate_utf8(collate(utf8_lcase#x, utf8_binary)) AS validate_utf8(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select validate_utf8(utf8_binary collate utf8_lcase_rtrim), validate_utf8(utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [validate_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS validate_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, validate_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS validate_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select try_validate_utf8(utf8_binary), try_validate_utf8(utf8_lcase) from t5
--- !query analysis
-Project [try_validate_utf8(utf8_binary#x) AS try_validate_utf8(utf8_binary)#x, try_validate_utf8(utf8_lcase#x) AS try_validate_utf8(utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select try_validate_utf8(utf8_binary collate utf8_lcase), try_validate_utf8(utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [try_validate_utf8(collate(utf8_binary#x, utf8_lcase)) AS try_validate_utf8(collate(utf8_binary, utf8_lcase))#x, try_validate_utf8(collate(utf8_lcase#x, utf8_binary)) AS try_validate_utf8(collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select try_validate_utf8(utf8_binary collate utf8_lcase_rtrim), try_validate_utf8(utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [try_validate_utf8(collate(utf8_binary#x, utf8_lcase_rtrim)) AS try_validate_utf8(collate(utf8_binary, utf8_lcase_rtrim))#x, try_validate_utf8(collate(utf8_lcase#x, utf8_binary_rtrim)) AS try_validate_utf8(collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substr(utf8_binary, 2, 2), substr(utf8_lcase, 2, 2) from t5
--- !query analysis
-Project [substr(utf8_binary#x, 2, 2) AS substr(utf8_binary, 2, 2)#x, substr(utf8_lcase#x, 2, 2) AS substr(utf8_lcase, 2, 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select substr(utf8_binary collate utf8_lcase, 2, 2), substr(utf8_lcase collate utf8_binary, 2, 2) from t5
--- !query analysis
-Project [substr(collate(utf8_binary#x, utf8_lcase), 2, 2) AS substr(collate(utf8_binary, utf8_lcase), 2, 2)#x, substr(collate(utf8_lcase#x, utf8_binary), 2, 2) AS substr(collate(utf8_lcase, utf8_binary), 2, 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select right(utf8_binary, 2), right(utf8_lcase, 2) from t5
--- !query analysis
-Project [right(utf8_binary#x, 2) AS right(utf8_binary, 2)#x, right(utf8_lcase#x, 2) AS right(utf8_lcase, 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select right(utf8_binary collate utf8_lcase, 2), right(utf8_lcase collate utf8_binary, 2) from t5
--- !query analysis
-Project [right(collate(utf8_binary#x, utf8_lcase), 2) AS right(collate(utf8_binary, utf8_lcase), 2)#x, right(collate(utf8_lcase#x, utf8_binary), 2) AS right(collate(utf8_lcase, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select left(utf8_binary, '2' collate utf8_lcase), left(utf8_lcase, 2) from t5
--- !query analysis
-Project [left(utf8_binary#x, cast(collate(2, utf8_lcase) as int)) AS left(utf8_binary, collate(2, utf8_lcase))#x, left(utf8_lcase#x, 2) AS left(utf8_lcase, 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select left(utf8_binary collate utf8_lcase, 2), left(utf8_lcase collate utf8_binary, 2) from t5
--- !query analysis
-Project [left(collate(utf8_binary#x, utf8_lcase), 2) AS left(collate(utf8_binary, utf8_lcase), 2)#x, left(collate(utf8_lcase#x, utf8_binary), 2) AS left(collate(utf8_lcase, utf8_binary), 2)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select rpad(utf8_binary, 8, utf8_lcase) from t5
--- !query analysis
-Project [rpad(cast(utf8_binary#x as string collate null), 8, cast(utf8_lcase#x as string collate null)) AS rpad(utf8_binary, 8, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select rpad(s, 8, utf8_binary) from t5
--- !query analysis
-Project [rpad(s#x, 8, utf8_binary#x) AS rpad(s, 8, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select rpad(utf8_binary collate utf8_binary, 8, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select rpad(utf8_binary, 8, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [rpad(utf8_binary#x, 8, collate(utf8_lcase#x, utf8_binary)) AS rpad(utf8_binary, 8, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select rpad(utf8_binary collate utf8_lcase, 8, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [rpad(collate(utf8_binary#x, utf8_lcase), 8, collate(utf8_lcase#x, utf8_lcase)) AS rpad(collate(utf8_binary, utf8_lcase), 8, collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary collate utf8_binary_rtrim, 8, utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [lpad(collate(utf8_binary#x, utf8_binary_rtrim), 8, collate(utf8_lcase#x, utf8_binary_rtrim)) AS lpad(collate(utf8_binary, utf8_binary_rtrim), 8, collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select rpad(utf8_binary, 8, 'a'), rpad(utf8_lcase, 8, 'a') from t5
--- !query analysis
-Project [rpad(utf8_binary#x, 8, a) AS rpad(utf8_binary, 8, a)#x, rpad(utf8_lcase#x, 8, a) AS rpad(utf8_lcase, 8, 'a' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select rpad(utf8_binary, 8, 'AaAA' collate utf8_lcase), rpad(utf8_lcase, 8, 'AAa' collate utf8_binary) from t5
--- !query analysis
-Project [rpad(cast(utf8_binary#x as string collate UTF8_LCASE), 8, collate(AaAA, utf8_lcase)) AS rpad(utf8_binary, 8, collate(AaAA, utf8_lcase))#x, rpad(cast(utf8_lcase#x as string), 8, collate(AAa, utf8_binary)) AS rpad(utf8_lcase, 8, collate(AAa, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary, 8, utf8_lcase) from t5
--- !query analysis
-Project [lpad(cast(utf8_binary#x as string collate null), 8, cast(utf8_lcase#x as string collate null)) AS lpad(utf8_binary, 8, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(s, 8, utf8_binary) from t5
--- !query analysis
-Project [lpad(s#x, 8, utf8_binary#x) AS lpad(s, 8, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary collate utf8_binary, 8, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select lpad(utf8_binary, 8, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [lpad(utf8_binary#x, 8, collate(utf8_lcase#x, utf8_binary)) AS lpad(utf8_binary, 8, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary collate utf8_lcase, 8, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [lpad(collate(utf8_binary#x, utf8_lcase), 8, collate(utf8_lcase#x, utf8_lcase)) AS lpad(collate(utf8_binary, utf8_lcase), 8, collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary collate utf8_binary_rtrim, 8, utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [lpad(collate(utf8_binary#x, utf8_binary_rtrim), 8, collate(utf8_lcase#x, utf8_binary_rtrim)) AS lpad(collate(utf8_binary, utf8_binary_rtrim), 8, collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary, 8, 'a'), lpad(utf8_lcase, 8, 'a') from t5
--- !query analysis
-Project [lpad(utf8_binary#x, 8, a) AS lpad(utf8_binary, 8, a)#x, lpad(utf8_lcase#x, 8, a) AS lpad(utf8_lcase, 8, 'a' collate UTF8_LCASE)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lpad(utf8_binary, 8, 'AaAA' collate utf8_lcase), lpad(utf8_lcase, 8, 'AAa' collate utf8_binary) from t5
--- !query analysis
-Project [lpad(cast(utf8_binary#x as string collate UTF8_LCASE), 8, collate(AaAA, utf8_lcase)) AS lpad(utf8_binary, 8, collate(AaAA, utf8_lcase))#x, lpad(cast(utf8_lcase#x as string), 8, collate(AAa, utf8_binary)) AS lpad(utf8_lcase, 8, collate(AAa, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select locate(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"locate(utf8_binary, utf8_lcase, 1)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 38,
- "fragment" : "locate(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select locate(s, utf8_binary) from t5
--- !query analysis
-Project [locate(s#x, utf8_binary#x, 1) AS locate(s, utf8_binary, 1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select locate(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select locate(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [locate(utf8_binary#x, collate(utf8_lcase#x, utf8_binary), 1) AS locate(utf8_binary, collate(utf8_lcase, utf8_binary), 1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select locate(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase, 3) from t5
--- !query analysis
-Project [locate(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase), 3) AS locate(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase), 3)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select locate(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 3) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"locate(collate(utf8_binary, unicode_ai), collate(utf8_lcase, unicode_ai), 3)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 79,
- "fragment" : "locate(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai, 3)"
- } ]
-}
-
-
--- !query
-select locate(utf8_binary, 'a'), locate(utf8_lcase, 'a') from t5
--- !query analysis
-Project [locate(utf8_binary#x, a, 1) AS locate(utf8_binary, a, 1)#x, locate(utf8_lcase#x, a, 1) AS locate(utf8_lcase, 'a' collate UTF8_LCASE, 1)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select locate(utf8_binary, 'AaAA' collate utf8_lcase, 4), locate(utf8_lcase, 'AAa' collate utf8_binary, 4) from t5
--- !query analysis
-Project [locate(cast(utf8_binary#x as string collate UTF8_LCASE), collate(AaAA, utf8_lcase), 4) AS locate(utf8_binary, collate(AaAA, utf8_lcase), 4)#x, locate(cast(utf8_lcase#x as string), collate(AAa, utf8_binary), 4) AS locate(utf8_lcase, collate(AAa, utf8_binary), 4)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select locate(utf8_binary, 'AaAA ' collate utf8_binary_rtrim, 4), locate(utf8_lcase, 'AAa ' collate utf8_binary, 4) from t5
--- !query analysis
-Project [locate(cast(utf8_binary#x as string collate UTF8_BINARY_RTRIM), collate(AaAA , utf8_binary_rtrim), 4) AS locate(utf8_binary, collate(AaAA , utf8_binary_rtrim), 4)#x, locate(cast(utf8_lcase#x as string), collate(AAa , utf8_binary), 4) AS locate(utf8_lcase, collate(AAa , utf8_binary), 4)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select TRIM(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"TRIM(BOTH utf8_binary FROM utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 36,
- "fragment" : "TRIM(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select TRIM(s, utf8_binary) from t5
--- !query analysis
-Project [trim(utf8_binary#x, Some(s#x)) AS TRIM(BOTH s FROM utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select TRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
- }
-}
-
-
--- !query
-select TRIM(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [trim(collate(utf8_lcase#x, utf8_binary), Some(utf8_binary#x)) AS TRIM(BOTH utf8_binary FROM collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select TRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [trim(collate(utf8_lcase#x, utf8_lcase), Some(collate(utf8_binary#x, utf8_lcase))) AS TRIM(BOTH collate(utf8_binary, utf8_lcase) FROM collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select TRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_lcase, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"TRIM(BOTH collate(utf8_binary, unicode_ai) FROM collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 74,
- "fragment" : "TRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select TRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [trim(collate(utf8_lcase#x, utf8_binary_rtrim), Some(collate(utf8_binary#x, utf8_binary_rtrim))) AS TRIM(BOTH collate(utf8_binary, utf8_binary_rtrim) FROM collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select TRIM('ABc', utf8_binary), TRIM('ABc', utf8_lcase) from t5
--- !query analysis
-Project [trim(utf8_binary#x, Some(ABc)) AS TRIM(BOTH ABc FROM utf8_binary)#x, trim(utf8_lcase#x, Some(ABc)) AS TRIM(BOTH 'ABc' collate UTF8_LCASE FROM utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select TRIM('ABc' collate utf8_lcase, utf8_binary), TRIM('AAa' collate utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [trim(cast(utf8_binary#x as string collate UTF8_LCASE), Some(collate(ABc, utf8_lcase))) AS TRIM(BOTH collate(ABc, utf8_lcase) FROM utf8_binary)#x, trim(cast(utf8_lcase#x as string), Some(collate(AAa, utf8_binary))) AS TRIM(BOTH collate(AAa, utf8_binary) FROM utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select BTRIM(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"TRIM(BOTH utf8_lcase FROM utf8_binary)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 37,
- "fragment" : "BTRIM(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select BTRIM(s, utf8_binary) from t5
--- !query analysis
-Project [btrim(s#x, utf8_binary#x) AS btrim(s, utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select BTRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING\", \"STRING COLLATE UTF8_LCASE\""
- }
-}
-
-
--- !query
-select BTRIM(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [btrim(utf8_binary#x, collate(utf8_lcase#x, utf8_binary)) AS btrim(utf8_binary, collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select BTRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [btrim(collate(utf8_binary#x, utf8_lcase), collate(utf8_lcase#x, utf8_lcase)) AS btrim(collate(utf8_binary, utf8_lcase), collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select BTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_binary, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"TRIM(BOTH collate(utf8_lcase, unicode_ai) FROM collate(utf8_binary, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 75,
- "fragment" : "BTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select BTRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [btrim(collate(utf8_binary#x, utf8_binary_rtrim), collate(utf8_lcase#x, utf8_binary_rtrim)) AS btrim(collate(utf8_binary, utf8_binary_rtrim), collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select BTRIM('ABc', utf8_binary), BTRIM('ABc', utf8_lcase) from t5
--- !query analysis
-Project [btrim(ABc, utf8_binary#x) AS btrim(ABc, utf8_binary)#x, btrim(ABc, utf8_lcase#x) AS btrim(ABc, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select BTRIM('ABc' collate utf8_lcase, utf8_binary), BTRIM('AAa' collate utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [btrim(collate(ABc, utf8_lcase), utf8_binary#x) AS btrim(collate(ABc, utf8_lcase), utf8_binary)#x, btrim(collate(AAa, utf8_binary), utf8_lcase#x) AS btrim(collate(AAa, utf8_binary), utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select LTRIM(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"TRIM(LEADING utf8_binary FROM utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 37,
- "fragment" : "LTRIM(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select LTRIM(s, utf8_binary) from t5
--- !query analysis
-Project [ltrim(utf8_binary#x, Some(s#x)) AS TRIM(LEADING s FROM utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select LTRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
- }
-}
-
-
--- !query
-select LTRIM(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [ltrim(collate(utf8_lcase#x, utf8_binary), Some(utf8_binary#x)) AS TRIM(LEADING utf8_binary FROM collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select LTRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [ltrim(collate(utf8_lcase#x, utf8_lcase), Some(collate(utf8_binary#x, utf8_lcase))) AS TRIM(LEADING collate(utf8_binary, utf8_lcase) FROM collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select LTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_lcase, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"TRIM(LEADING collate(utf8_binary, unicode_ai) FROM collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 75,
- "fragment" : "LTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select LTRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [ltrim(collate(utf8_lcase#x, utf8_binary_rtrim), Some(collate(utf8_binary#x, utf8_binary_rtrim))) AS TRIM(LEADING collate(utf8_binary, utf8_binary_rtrim) FROM collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select LTRIM('ABc', utf8_binary), LTRIM('ABc', utf8_lcase) from t5
--- !query analysis
-Project [ltrim(utf8_binary#x, Some(ABc)) AS TRIM(LEADING ABc FROM utf8_binary)#x, ltrim(utf8_lcase#x, Some(ABc)) AS TRIM(LEADING 'ABc' collate UTF8_LCASE FROM utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select LTRIM('ABc' collate utf8_lcase, utf8_binary), LTRIM('AAa' collate utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [ltrim(cast(utf8_binary#x as string collate UTF8_LCASE), Some(collate(ABc, utf8_lcase))) AS TRIM(LEADING collate(ABc, utf8_lcase) FROM utf8_binary)#x, ltrim(cast(utf8_lcase#x as string), Some(collate(AAa, utf8_binary))) AS TRIM(LEADING collate(AAa, utf8_binary) FROM utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select RTRIM(utf8_binary, utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "INDETERMINATE_COLLATION_IN_EXPRESSION",
- "sqlState" : "42P22",
- "messageParameters" : {
- "expr" : "\"TRIM(TRAILING utf8_binary FROM utf8_lcase)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 37,
- "fragment" : "RTRIM(utf8_binary, utf8_lcase)"
- } ]
-}
-
-
--- !query
-select RTRIM(s, utf8_binary) from t5
--- !query analysis
-Project [rtrim(utf8_binary#x, Some(s#x)) AS TRIM(TRAILING s FROM utf8_binary)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select RTRIM(utf8_binary collate utf8_binary, s collate utf8_lcase) from t5
--- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "COLLATION_MISMATCH.EXPLICIT",
- "sqlState" : "42P21",
- "messageParameters" : {
- "explicitTypes" : "\"STRING COLLATE UTF8_LCASE\", \"STRING\""
- }
-}
-
-
--- !query
-select RTRIM(utf8_binary, utf8_lcase collate utf8_binary) from t5
--- !query analysis
-Project [rtrim(collate(utf8_lcase#x, utf8_binary), Some(utf8_binary#x)) AS TRIM(TRAILING utf8_binary FROM collate(utf8_lcase, utf8_binary))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select RTRIM(utf8_binary collate utf8_lcase, utf8_lcase collate utf8_lcase) from t5
--- !query analysis
-Project [rtrim(collate(utf8_lcase#x, utf8_lcase), Some(collate(utf8_binary#x, utf8_lcase))) AS TRIM(TRAILING collate(utf8_binary, utf8_lcase) FROM collate(utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select RTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai) from t5
--- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
- "sqlState" : "42K09",
- "messageParameters" : {
- "inputSql" : "\"collate(utf8_lcase, unicode_ai)\"",
- "inputType" : "\"STRING COLLATE UNICODE_AI\"",
- "paramIndex" : "first",
- "requiredType" : "\"STRING\"",
- "sqlExpr" : "\"TRIM(TRAILING collate(utf8_binary, unicode_ai) FROM collate(utf8_lcase, unicode_ai))\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 75,
- "fragment" : "RTRIM(utf8_binary collate unicode_ai, utf8_lcase collate unicode_ai)"
- } ]
-}
-
-
--- !query
-select RTRIM(utf8_binary collate utf8_binary_rtrim, utf8_lcase collate utf8_binary_rtrim) from t5
--- !query analysis
-Project [rtrim(collate(utf8_lcase#x, utf8_binary_rtrim), Some(collate(utf8_binary#x, utf8_binary_rtrim))) AS TRIM(TRAILING collate(utf8_binary, utf8_binary_rtrim) FROM collate(utf8_lcase, utf8_binary_rtrim))#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select RTRIM('ABc', utf8_binary), RTRIM('ABc', utf8_lcase) from t5
--- !query analysis
-Project [rtrim(utf8_binary#x, Some(ABc)) AS TRIM(TRAILING ABc FROM utf8_binary)#x, rtrim(utf8_lcase#x, Some(ABc)) AS TRIM(TRAILING 'ABc' collate UTF8_LCASE FROM utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select RTRIM('ABc' collate utf8_lcase, utf8_binary), RTRIM('AAa' collate utf8_binary, utf8_lcase) from t5
--- !query analysis
-Project [rtrim(cast(utf8_binary#x as string collate UTF8_LCASE), Some(collate(ABc, utf8_lcase))) AS TRIM(TRAILING collate(ABc, utf8_lcase) FROM utf8_binary)#x, rtrim(cast(utf8_lcase#x as string), Some(collate(AAa, utf8_binary))) AS TRIM(TRAILING collate(AAa, utf8_binary) FROM utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
--- !query analysis
-Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select `concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)` from (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-)
--- !query analysis
-Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias __auto_generated_subquery_name
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select * from (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-)
--- !query analysis
-Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias __auto_generated_subquery_name
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select subq1.* from (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-) AS subq1
--- !query analysis
-Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias subq1
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-with cte as (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-)
-select * from cte
--- !query analysis
-WithCTE
-:- CTERelationDef xxxx, false
-: +- SubqueryAlias cte
-: +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-: +- SubqueryAlias spark_catalog.default.t5
-: +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-+- Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias cte
- +- CTERelationRef xxxx, true, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x], false, false
-
-
--- !query
-select * from values (1) where exists (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-)
--- !query analysis
-Project [col1#x]
-+- Filter exists#x []
- : +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- : +- SubqueryAlias spark_catalog.default.t5
- : +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
- +- LocalRelation [col1#x]
-
-
--- !query
-select (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5 limit 1
-)
--- !query analysis
-Project [scalar-subquery#x [] AS scalarsubquery()#x]
-: +- GlobalLimit 1
-: +- LocalLimit 1
-: +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-: +- SubqueryAlias spark_catalog.default.t5
-: +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-+- OneRowRelation
-
-
--- !query
-select (
- with cte as (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
- )
- select * from cte limit 1
-)
--- !query analysis
-Project [scalar-subquery#x [] AS scalarsubquery()#x]
-: +- WithCTE
-: :- CTERelationDef xxxx, false
-: : +- SubqueryAlias cte
-: : +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-: : +- SubqueryAlias spark_catalog.default.t5
-: : +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-: +- GlobalLimit 1
-: +- LocalLimit 1
-: +- Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-: +- SubqueryAlias cte
-: +- CTERelationRef xxxx, true, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x], false, false
-+- OneRowRelation
-
-
--- !query
-select * from (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5 limit 1
-)
-where (
- `concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)` == 'aaa'
-)
--- !query analysis
-Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- Filter (concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x = aaa)
- +- SubqueryAlias __auto_generated_subquery_name
- +- GlobalLimit 1
- +- LocalLimit 1
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lower(`concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)`) from (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
- group by 1
- order by 1
-)
--- !query analysis
-Project [lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x) AS lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias __auto_generated_subquery_name
- +- Sort [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x ASC NULLS FIRST], true
- +- Aggregate [concat_ws( , utf8_lcase#x, utf8_lcase#x)], [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select lower(`concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)`) from (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
- group by 1
- order by max(concat_ws(' ', utf8_lcase, utf8_lcase))
-)
--- !query analysis
-Project [lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x) AS lower(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x]
-+- SubqueryAlias __auto_generated_subquery_name
- +- Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- Sort [max(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x ASC NULLS FIRST], true
- +- Aggregate [concat_ws( , utf8_lcase#x, utf8_lcase#x)], [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x, max(concat_ws( , utf8_lcase#x, utf8_lcase#x)) AS max(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase))#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-create temporary view v1 as (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-)
--- !query analysis
-CreateViewCommand `v1`, (
- select concat_ws(' ', utf8_lcase, utf8_lcase) from t5
-), false, false, LocalTempView, UNSUPPORTED, true
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select * from v1
--- !query analysis
-Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias v1
- +- View (`v1`, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x])
- +- Project [cast(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x as string collate UTF8_LCASE) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-select `concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)` from v1
--- !query analysis
-Project [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
-+- SubqueryAlias v1
- +- View (`v1`, [concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x])
- +- Project [cast(concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x as string collate UTF8_LCASE) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- Project [concat_ws( , utf8_lcase#x, utf8_lcase#x) AS concat_ws(' ' collate UTF8_LCASE, utf8_lcase, utf8_lcase)#x]
- +- SubqueryAlias spark_catalog.default.t5
- +- Relation spark_catalog.default.t5[s#x,utf8_binary#x,utf8_lcase#x] parquet
-
-
--- !query
-drop view v1
--- !query analysis
-DropTempViewCommand v1
-
-
--- !query
-drop table t5
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t5
-
-
--- !query
-drop table t6
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t6
-
-
--- !query
-drop table t7
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t7
-
-
--- !query
-drop table t8
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t8
-
-
--- !query
-drop table t9
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t9
-
-
--- !query
-drop table t10
--- !query analysis
-DropTable false, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t10
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/columnresolution.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/columnresolution.sql.out
index e0ef6c1248aea..5a2447d440035 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/columnresolution.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/columnresolution.sql.out
@@ -337,7 +337,7 @@ CreateDataSourceTableCommand `spark_catalog`.`mydb1`.`t5`, false
INSERT INTO t5 VALUES(1, (2, 3))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/mydb1.db/t5, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/mydb1.db/t5], Append, `spark_catalog`.`mydb1`.`t5`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/mydb1.db/t5), [i1, t5]
-+- Project [cast(col1#x as int) AS i1#x, named_struct(i1, cast(col2#x.col1 as int), i2, cast(col2#x.col2 as int)) AS t5#x]
++- Project [col1#x AS i1#x, named_struct(i1, col2#x.col1, i2, col2#x.col2) AS t5#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/cte-recursion.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/cte-recursion.sql.out
index f67d7c6f8142b..23ee616dda8ea 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/cte-recursion.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/cte-recursion.sql.out
@@ -409,20 +409,10 @@ WITH RECURSIVE r(level) AS (
)
SELECT * FROM r
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
+org.apache.spark.sql.AnalysisException
{
- "errorClass" : "UNRESOLVED_COLUMN.WITHOUT_SUGGESTION",
- "sqlState" : "42703",
- "messageParameters" : {
- "objectName" : "`level`"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 62,
- "stopIndex" : 66,
- "fragment" : "level"
- } ]
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
}
@@ -471,24 +461,11 @@ WITH RECURSIVE t(col) (
)
SELECT * FROM t LIMIT 5
-- !query analysis
-WithCTE
-:- CTERelationDef xxxx, false
-: +- SubqueryAlias t
-: +- Project [1#x AS col#x]
-: +- UnionLoop xxxx
-: :- Project [1 AS 1#x]
-: : +- OneRowRelation
-: +- Project [scalar-subquery#x [] AS scalarsubquery()#x]
-: : +- Aggregate [max(col#x) AS max(col)#x]
-: : +- SubqueryAlias t
-: : +- Project [1#x AS col#x]
-: : +- UnionLoopRef xxxx, [1#x], false
-: +- OneRowRelation
-+- GlobalLimit 5
- +- LocalLimit 5
- +- Project [col#x]
- +- SubqueryAlias t
- +- CTERelationRef xxxx, true, [col#x], false, false
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_REFERENCE.PLACE",
+ "sqlState" : "42836"
+}
-- !query
@@ -511,6 +488,35 @@ org.apache.spark.sql.catalyst.ExtendedAnalysisException
}
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ SELECT (SELECT n+1 FROM t1 WHERE n<5)
+)
+SELECT * FROM t1 LIMIT 5
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x]
+: : +- OneRowRelation
+: +- Project [scalar-subquery#x [] AS scalarsubquery()#x]
+: : +- Project [(n#x + 1) AS (n + 1)#x]
+: : +- Filter (n#x < 5)
+: : +- SubqueryAlias t1
+: : +- Project [1#x AS n#x]
+: : +- UnionLoopRef xxxx, [1#x], false
+: +- OneRowRelation
++- GlobalLimit 5
+ +- LocalLimit 5
+ +- Project [n#x]
+ +- SubqueryAlias t1
+ +- CTERelationRef xxxx, true, [n#x], false, false
+
+
-- !query
WITH RECURSIVE
t1 AS (
@@ -1360,7 +1366,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`tb`, false
INSERT INTO tb VALUES (0), (1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/tb, false, JSON, [path=file:[not included in comparison]/{warehouse_dir}/tb], Append, `spark_catalog`.`default`.`tb`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/tb), [next]
-+- Project [cast(col1#x as int) AS next#x]
++- Project [col1#x AS next#x]
+- LocalRelation [col1#x]
@@ -1577,28 +1583,11 @@ WITH RECURSIVE t1(n) AS (
SELECT n+1 FROM t2 WHERE n < 5)
SELECT * FROM t1
-- !query analysis
-WithCTE
-:- CTERelationDef xxxx, false
-: +- SubqueryAlias t1
-: +- Project [1#x AS n#x]
-: +- WithCTE
-: :- CTERelationDef xxxx, false
-: : +- SubqueryAlias t2
-: : +- Project [n#x AS n#x]
-: : +- Project [n#x]
-: : +- SubqueryAlias t1
-: : +- Project [1#x AS n#x]
-: : +- UnionLoopRef xxxx, [1#x], false
-: +- UnionLoop xxxx
-: :- Project [1 AS 1#x]
-: : +- OneRowRelation
-: +- Project [(n#x + 1) AS (n + 1)#x]
-: +- Filter (n#x < 5)
-: +- SubqueryAlias t2
-: +- CTERelationRef xxxx, true, [n#x], false, false
-+- Project [n#x]
- +- SubqueryAlias t1
- +- CTERelationRef xxxx, true, [n#x], false, false
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
+}
-- !query
@@ -1609,26 +1598,11 @@ WITH RECURSIVE t1 AS (
SELECT n+1 FROM t2 WHERE n < 5)
SELECT * FROM t1
-- !query analysis
-WithCTE
-:- CTERelationDef xxxx, false
-: +- SubqueryAlias t1
-: +- WithCTE
-: :- CTERelationDef xxxx, false
-: : +- SubqueryAlias t2
-: : +- Project [n#x AS n#x]
-: : +- Project [n#x]
-: : +- SubqueryAlias t1
-: : +- UnionLoopRef xxxx, [n#x], false
-: +- UnionLoop xxxx
-: :- Project [1 AS n#x]
-: : +- OneRowRelation
-: +- Project [(n#x + 1) AS (n + 1)#x]
-: +- Filter (n#x < 5)
-: +- SubqueryAlias t2
-: +- CTERelationRef xxxx, true, [n#x], false, false
-+- Project [n#x]
- +- SubqueryAlias t1
- +- CTERelationRef xxxx, true, [n#x], false, false
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
+}
-- !query
@@ -1812,3 +1786,348 @@ WITH RECURSIVE randoms(val) AS (
SELECT val FROM randoms LIMIT 5
-- !query analysis
[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+WITH RECURSIVE t1(n, m) AS (
+ SELECT 1, CAST(1 AS BIGINT)
+ UNION ALL
+ SELECT n+1, n+1 FROM t1 WHERE n < 5)
+SELECT * FROM t1
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x, CAST(1 AS BIGINT)#xL AS m#xL]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x, cast(1 as bigint) AS CAST(1 AS BIGINT)#xL]
+: : +- OneRowRelation
+: +- Project [cast((n + 1)#x as int) AS (n + 1)#x, cast((n + 1)#x as bigint) AS (n + 1)#xL]
+: +- Project [(n#x + 1) AS (n + 1)#x, (n#x + 1) AS (n + 1)#x]
+: +- Filter (n#x < 5)
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x, CAST(1 AS BIGINT)#xL AS m#xL]
+: +- UnionLoopRef xxxx, [1#x, CAST(1 AS BIGINT)#xL], false
++- Project [n#x, m#xL]
+ +- SubqueryAlias t1
+ +- CTERelationRef xxxx, true, [n#x, m#xL], false, false
+
+
+-- !query
+WITH RECURSIVE t1(n, m) AS (
+ SELECT 1, 1
+ UNION ALL
+ SELECT n+1, CAST(n+1 AS BIGINT) FROM t1 WHERE n < 5)
+SELECT * FROM t1
+-- !query analysis
+org.apache.spark.SparkException
+{
+ "errorClass" : "CANNOT_MERGE_INCOMPATIBLE_DATA_TYPE",
+ "sqlState" : "42825",
+ "messageParameters" : {
+ "left" : "\"INT\"",
+ "right" : "\"BIGINT\""
+ }
+}
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ SELECT CASE WHEN n < 5 THEN n + 1 ELSE NULL END FROM t1
+)
+SELECT * FROM t1 LIMIT 25
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x]
+: : +- OneRowRelation
+: +- Project [CASE WHEN (n#x < 5) THEN (n#x + 1) ELSE cast(null as int) END AS CASE WHEN (n < 5) THEN (n + 1) ELSE NULL END#x]
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoopRef xxxx, [1#x], false
++- GlobalLimit 25
+ +- LocalLimit 25
+ +- Project [n#x]
+ +- SubqueryAlias t1
+ +- CTERelationRef xxxx, true, [n#x], false, false
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ SELECT n + 1 FROM t1 WHERE n < 5
+)
+SELECT (SELECT SUM(n) FROM (SELECT * FROM t1)), (SELECT SUM(n) FROM (SELECT * FROM t1 LIMIT 3))
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x]
+: : +- OneRowRelation
+: +- Project [(n#x + 1) AS (n + 1)#x]
+: +- Filter (n#x < 5)
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoopRef xxxx, [1#x], false
++- Project [scalar-subquery#x [] AS scalarsubquery()#xL, scalar-subquery#x [] AS scalarsubquery()#xL]
+ : :- Aggregate [sum(n#x) AS sum(n)#xL]
+ : : +- SubqueryAlias __auto_generated_subquery_name
+ : : +- Project [n#x]
+ : : +- SubqueryAlias t1
+ : : +- CTERelationRef xxxx, true, [n#x], false, false
+ : +- Aggregate [sum(n#x) AS sum(n)#xL]
+ : +- SubqueryAlias __auto_generated_subquery_name
+ : +- GlobalLimit 3
+ : +- LocalLimit 3
+ : +- Project [n#x]
+ : +- SubqueryAlias t1
+ : +- CTERelationRef xxxx, true, [n#x], false, false
+ +- OneRowRelation
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ SELECT n + 1 FROM t1
+)
+SELECT (SELECT SUM(n) FROM (SELECT * FROM t1 LIMIT 5)), (SELECT SUM(n) FROM (SELECT * FROM t1 LIMIT 3))
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x]
+: : +- OneRowRelation
+: +- Project [(n#x + 1) AS (n + 1)#x]
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoopRef xxxx, [1#x], false
++- Project [scalar-subquery#x [] AS scalarsubquery()#xL, scalar-subquery#x [] AS scalarsubquery()#xL]
+ : :- Aggregate [sum(n#x) AS sum(n)#xL]
+ : : +- SubqueryAlias __auto_generated_subquery_name
+ : : +- GlobalLimit 5
+ : : +- LocalLimit 5
+ : : +- Project [n#x]
+ : : +- SubqueryAlias t1
+ : : +- CTERelationRef xxxx, true, [n#x], false, false
+ : +- Aggregate [sum(n#x) AS sum(n)#xL]
+ : +- SubqueryAlias __auto_generated_subquery_name
+ : +- GlobalLimit 3
+ : +- LocalLimit 3
+ : +- Project [n#x]
+ : +- SubqueryAlias t1
+ : +- CTERelationRef xxxx, true, [n#x], false, false
+ +- OneRowRelation
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ SELECT n + 1 FROM t1
+), t2(m) AS (
+ SELECT (SELECT SUM(n) FROM (SELECT n FROM t1 LIMIT 10) AS sums)
+ UNION ALL
+ SELECT m + (SELECT SUM(n) FROM (SELECT n FROM t1 LIMIT 3) AS sums) FROM t2
+)
+SELECT * FROM t2 LIMIT 20
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x]
+: : +- OneRowRelation
+: +- Project [(n#x + 1) AS (n + 1)#x]
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoopRef xxxx, [1#x], false
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t2
+: +- Project [scalarsubquery()#xL AS m#xL]
+: +- UnionLoop xxxx
+: :- Project [scalar-subquery#x [] AS scalarsubquery()#xL]
+: : : +- Aggregate [sum(n#x) AS sum(n)#xL]
+: : : +- SubqueryAlias sums
+: : : +- GlobalLimit 10
+: : : +- LocalLimit 10
+: : : +- Project [n#x]
+: : : +- SubqueryAlias t1
+: : : +- CTERelationRef xxxx, true, [n#x], false, false
+: : +- OneRowRelation
+: +- Project [(m#xL + scalar-subquery#x []) AS (m + scalarsubquery())#xL]
+: : +- Aggregate [sum(n#x) AS sum(n)#xL]
+: : +- SubqueryAlias sums
+: : +- GlobalLimit 3
+: : +- LocalLimit 3
+: : +- Project [n#x]
+: : +- SubqueryAlias t1
+: : +- CTERelationRef xxxx, true, [n#x], false, false
+: +- SubqueryAlias t2
+: +- Project [scalarsubquery()#xL AS m#xL]
+: +- UnionLoopRef xxxx, [scalarsubquery()#xL], false
++- GlobalLimit 20
+ +- LocalLimit 20
+ +- Project [m#xL]
+ +- SubqueryAlias t2
+ +- CTERelationRef xxxx, true, [m#xL], false, false
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ SELECT n + 1 FROM t1
+)
+ ((SELECT n FROM t1) UNION ALL (SELECT n FROM t1)) LIMIT 20
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoop xxxx
+: :- Project [1 AS 1#x]
+: : +- OneRowRelation
+: +- Project [(n#x + 1) AS (n + 1)#x]
+: +- SubqueryAlias t1
+: +- Project [1#x AS n#x]
+: +- UnionLoopRef xxxx, [1#x], false
++- GlobalLimit 20
+ +- LocalLimit 20
+ +- Union false, false
+ :- Project [n#x]
+ : +- SubqueryAlias t1
+ : +- CTERelationRef xxxx, true, [n#x], false, false
+ +- Project [n#x]
+ +- SubqueryAlias t1
+ +- CTERelationRef xxxx, true, [n#x], false, false
+
+
+-- !query
+WITH RECURSIVE win(id, val) AS (
+ SELECT 1, CAST(10 AS BIGINT)
+ UNION ALL
+ SELECT id + 1, SUM(val) OVER (ORDER BY id ROWS BETWEEN 1 PRECEDING AND CURRENT ROW)
+ FROM win WHERE id < 3
+)
+SELECT * FROM win
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_REFERENCE.PLACE",
+ "sqlState" : "42836"
+}
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1
+ UNION ALL
+ (SELECT n + 1 FROM t1 WHERE n < 5 ORDER BY n)
+)
+SELECT * FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_REFERENCE.PLACE",
+ "sqlState" : "42836"
+}
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ SELECT 1 FROM t1
+ UNION ALL
+ SELECT n+1 FROM t1 WHERE n < 5)
+SELECT * FROM t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
+}
+
+
+-- !query
+WITH RECURSIVE t1 AS (
+ SELECT 1 AS n FROM t1
+ UNION ALL
+ SELECT n+1 FROM t1 WHERE n < 5)
+SELECT * FROM t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
+}
+
+
+-- !query
+WITH RECURSIVE t1(n) AS (
+ WITH t2(m) AS (SELECT 1)
+ SELECT 1 FROM t1
+ UNION ALL
+ SELECT n+1 FROM t1 WHERE n < 5)
+SELECT * FROM t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
+}
+
+
+-- !query
+WITH RECURSIVE t1 AS (
+ WITH t2(m) AS (SELECT 1)
+ SELECT 1 AS n FROM t1
+ UNION ALL
+ SELECT n+1 FROM t1 WHERE n < 5)
+SELECT * FROM t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
+}
+
+
+-- !query
+WITH RECURSIVE t AS (
+ SELECT 1 AS n
+ UNION ALL
+ SELECT n + m
+ FROM (SELECT 2 as m) subq
+ JOIN t ON n = m
+ WHERE n <> m
+)
+SELECT * FROM t
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias t
+: +- UnionLoop xxxx
+: :- Project [1 AS n#x]
+: : +- OneRowRelation
+: +- Project [(n#x + m#x) AS (n + m)#x]
+: +- Filter NOT (n#x = m#x)
+: +- Join Inner, (n#x = m#x)
+: :- SubqueryAlias subq
+: : +- Project [2 AS m#x]
+: : +- OneRowRelation
+: +- SubqueryAlias t
+: +- UnionLoopRef xxxx, [n#x], false
++- Project [n#x]
+ +- SubqueryAlias t
+ +- CTERelationRef xxxx, true, [n#x], false, false
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/datetime-legacy.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/datetime-legacy.sql.out
index 3681a5dfd3904..e9d301c649808 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/datetime-legacy.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/datetime-legacy.sql.out
@@ -1113,6 +1113,235 @@ Project [make_timestamp(1, 1, 1, 1, 1, cast(999.999999 as decimal(16,6)), None,
+- OneRowRelation
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11))
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), None, None, Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678))
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), None, Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', TIME'00:00:00')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, TIME'00:00:00')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'MIT')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(MIT), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), MIT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'PST')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(PST), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), PST)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'UTC')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(UTC), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), UTC)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'CET')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(CET), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), CET)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'JST')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, true), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(JST), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), JST)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', TIME'00:00:00', 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, TIME'00:00:00', 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', NULL, 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', TIME'00:00:00', NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, NULL, 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, TIME'00:00:00', NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', NULL, NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, NULL, NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(timestamp '2018-11-17 13:33:33', TIME'0:0:0', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"DATE\"",
+ "sqlExpr" : "\"make_timestamp(TIMESTAMP '2018-11-17 13:33:33', TIME '00:00:00', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 74,
+ "fragment" : "make_timestamp(timestamp '2018-11-17 13:33:33', TIME'0:0:0', 'CET')"
+ } ]
+}
+
+
+-- !query
+SELECT make_timestamp(timestamp_ntz '2018-11-17 13:33:33', TIME'0:0:0', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP_NTZ '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP_NTZ\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"DATE\"",
+ "sqlExpr" : "\"make_timestamp(TIMESTAMP_NTZ '2018-11-17 13:33:33', TIME '00:00:00', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 78,
+ "fragment" : "make_timestamp(timestamp_ntz '2018-11-17 13:33:33', TIME'0:0:0', 'CET')"
+ } ]
+}
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', timestamp '2018-11-17 13:33:33', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"TIME\"",
+ "sqlExpr" : "\"make_timestamp(DATE '1970-01-01', TIMESTAMP '2018-11-17 13:33:33', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 79,
+ "fragment" : "make_timestamp(DATE'1970-01-01', timestamp '2018-11-17 13:33:33', 'CET')"
+ } ]
+}
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', timestamp_ntz '2018-11-17 13:33:33', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP_NTZ '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP_NTZ\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"TIME\"",
+ "sqlExpr" : "\"make_timestamp(DATE '1970-01-01', TIMESTAMP_NTZ '2018-11-17 13:33:33', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 83,
+ "fragment" : "make_timestamp(DATE'1970-01-01', timestamp_ntz '2018-11-17 13:33:33', 'CET')"
+ } ]
+}
+
+
-- !query
select TIMESTAMP_SECONDS(1230219000),TIMESTAMP_SECONDS(-1230219000),TIMESTAMP_SECONDS(null)
-- !query analysis
@@ -1595,45 +1824,13 @@ org.apache.spark.sql.catalyst.ExtendedAnalysisException
-- !query
select timestamp'2011-11-11 11:11:11' + null
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.BINARY_OP_DIFF_TYPES",
- "sqlState" : "42K09",
- "messageParameters" : {
- "left" : "\"TIMESTAMP\"",
- "right" : "\"VOID\"",
- "sqlExpr" : "\"(TIMESTAMP '2011-11-11 11:11:11' + NULL)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 44,
- "fragment" : "timestamp'2011-11-11 11:11:11' + null"
- } ]
-}
+[Analyzer test output redacted due to nondeterminism]
-- !query
select null + timestamp'2011-11-11 11:11:11'
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.BINARY_OP_DIFF_TYPES",
- "sqlState" : "42K09",
- "messageParameters" : {
- "left" : "\"VOID\"",
- "right" : "\"TIMESTAMP\"",
- "sqlExpr" : "\"(NULL + TIMESTAMP '2011-11-11 11:11:11')\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 44,
- "fragment" : "null + timestamp'2011-11-11 11:11:11'"
- } ]
-}
+[Analyzer test output redacted due to nondeterminism]
-- !query
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/decimalArithmeticOperations.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/decimalArithmeticOperations.sql.out
index d75f4d41bd425..5c136f6fe1779 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/decimalArithmeticOperations.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/decimalArithmeticOperations.sql.out
@@ -51,7 +51,7 @@ insert into decimals_test values(1, 100.0, 999.0), (2, 12345.123, 12345.123),
(3, 0.1234567891011, 1234.1), (4, 123456789123456789.0, 1.123456789123456789)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/decimals_test, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/decimals_test], Append, `spark_catalog`.`default`.`decimals_test`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/decimals_test), [id, a, b]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,18)) AS a#x, cast(col3#x as decimal(38,18)) AS b#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,18)) AS a#x, cast(col3#x as decimal(38,18)) AS b#x]
+- LocalRelation [col1#x, col2#x, col3#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/describe-part-after-analyze.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/describe-part-after-analyze.sql.out
index 8bb042e99795f..5da91fd74014f 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/describe-part-after-analyze.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/describe-part-after-analyze.sql.out
@@ -12,7 +12,7 @@ VALUES ('k1', 100), ('k2', 200), ('k3', 300)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t, [ds=2017-08-01, hr=10], false, [ds#x, hr#x], Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t], Append, `spark_catalog`.`default`.`t`, org.apache.spark.sql.execution.datasources.CatalogFileIndex(file:[not included in comparison]/{warehouse_dir}/t), [key, value, ds, hr]
+- Project [key#x, value#x, cast(2017-08-01 as string) AS ds#x, cast(10 as int) AS hr#x]
- +- Project [cast(col1#x as string) AS key#x, cast(col2#x as string) AS value#x]
+ +- Project [col1#x AS key#x, cast(col2#x as string) AS value#x]
+- LocalRelation [col1#x, col2#x]
@@ -22,7 +22,7 @@ VALUES ('k1', 101), ('k2', 201), ('k3', 301), ('k4', 401)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t, [ds=2017-08-01, hr=11], false, [ds#x, hr#x], Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t], Append, `spark_catalog`.`default`.`t`, org.apache.spark.sql.execution.datasources.CatalogFileIndex(file:[not included in comparison]/{warehouse_dir}/t), [key, value, ds, hr]
+- Project [key#x, value#x, cast(2017-08-01 as string) AS ds#x, cast(11 as int) AS hr#x]
- +- Project [cast(col1#x as string) AS key#x, cast(col2#x as string) AS value#x]
+ +- Project [col1#x AS key#x, cast(col2#x as string) AS value#x]
+- LocalRelation [col1#x, col2#x]
@@ -32,7 +32,7 @@ VALUES ('k1', 102), ('k2', 202)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t, [ds=2017-09-01, hr=5], false, [ds#x, hr#x], Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t], Append, `spark_catalog`.`default`.`t`, org.apache.spark.sql.execution.datasources.CatalogFileIndex(file:[not included in comparison]/{warehouse_dir}/t), [key, value, ds, hr]
+- Project [key#x, value#x, cast(2017-09-01 as string) AS ds#x, cast(5 as int) AS hr#x]
- +- Project [cast(col1#x as string) AS key#x, cast(col2#x as string) AS value#x]
+ +- Project [col1#x AS key#x, cast(col2#x as string) AS value#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/describe.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/describe.sql.out
index 2f7237663b646..e49673d33943b 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/describe.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/describe.sql.out
@@ -213,6 +213,41 @@ org.apache.spark.sql.catalyst.parser.ParseException
}
+-- !query
+DROP SCHEMA IF EXISTS test_schema
+-- !query analysis
+DropNamespace true, false
++- ResolvedNamespace V2SessionCatalog(spark_catalog), [test_schema]
+
+
+-- !query
+CREATE SCHEMA test_schema DEFAULT COLLATION UNICODE
+-- !query analysis
+CreateNamespace false, [collation=UNICODE]
++- ResolvedNamespace V2SessionCatalog(spark_catalog), [test_schema]
+
+
+-- !query
+DESCRIBE SCHEMA EXTENDED test_schema
+-- !query analysis
+DescribeNamespace true, [info_name#x, info_value#x]
++- ResolvedNamespace V2SessionCatalog(spark_catalog), [test_schema]
+
+
+-- !query
+ALTER SCHEMA test_schema DEFAULT COLLATION UTF8_LCASE
+-- !query analysis
+SetNamespaceCollationCommand UTF8_LCASE
++- ResolvedNamespace V2SessionCatalog(spark_catalog), [test_schema]
+
+
+-- !query
+DESCRIBE SCHEMA EXTENDED test_schema
+-- !query analysis
+DescribeNamespace true, [info_name#x, info_value#x]
++- ResolvedNamespace V2SessionCatalog(spark_catalog), [test_schema]
+
+
-- !query
DESC temp_v
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers-enabled.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers-enabled.sql.out
index cb42a54b85d57..51569e6c965c8 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers-enabled.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers-enabled.sql.out
@@ -154,6 +154,26 @@ org.apache.spark.sql.AnalysisException
}
+-- !query
+select 1 from "not_""exists"
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "TABLE_OR_VIEW_NOT_FOUND",
+ "sqlState" : "42P01",
+ "messageParameters" : {
+ "relationName" : "`not_\"exists`"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 15,
+ "stopIndex" : 28,
+ "fragment" : "\"not_\"\"exists\""
+ } ]
+}
+
+
-- !query
SELECT 1 FROM `hello`
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers.sql.out
index a02bf525f947d..5c8b549a50658 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/double-quoted-identifiers.sql.out
@@ -111,6 +111,20 @@ org.apache.spark.sql.catalyst.parser.ParseException
}
+-- !query
+select 1 from "not_""exists"
+-- !query analysis
+org.apache.spark.sql.catalyst.parser.ParseException
+{
+ "errorClass" : "PARSE_SYNTAX_ERROR",
+ "sqlState" : "42601",
+ "messageParameters" : {
+ "error" : "'\"not_\"\"exists\"'",
+ "hint" : ""
+ }
+}
+
+
-- !query
SELECT 1 FROM `hello`
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/execute-immediate.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/execute-immediate.sql.out
index 78bf1ccb1678c..d575cac56d28b 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/execute-immediate.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/execute-immediate.sql.out
@@ -204,7 +204,7 @@ Project [id#x, name#x, data#x]
EXECUTE IMMEDIATE 'INSERT INTO x VALUES(?)' USING 1
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/x, false, CSV, [path=file:[not included in comparison]/{warehouse_dir}/x], Append, `spark_catalog`.`default`.`x`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/x), [id]
-+- Project [cast(col1#x as int) AS id#x]
++- Project [col1#x AS id#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/group-analytics.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/group-analytics.sql.out
index fff84a1a253b4..fc0f6fef8c16c 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/group-analytics.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/group-analytics.sql.out
@@ -383,7 +383,7 @@ HAVING GROUPING(year) = 1 AND GROUPING_ID(course, year) > 0 ORDER BY course, yea
Sort [course#x ASC NULLS FIRST, year#x ASC NULLS FIRST], true
+- Project [course#x, year#x]
+- Filter ((cast(cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) as int) = 1) AND (spark_grouping_id#xL > cast(0 as bigint)))
- +- Aggregate [course#x, year#x, spark_grouping_id#xL], [course#x, year#x, spark_grouping_id#xL, spark_grouping_id#xL]
+ +- Aggregate [course#x, year#x, spark_grouping_id#xL], [course#x, year#x, spark_grouping_id#xL]
+- Expand [[course#x, year#x, earnings#x, course#x, year#x, 0], [course#x, year#x, earnings#x, course#x, null, 1], [course#x, year#x, earnings#x, null, year#x, 2], [course#x, year#x, earnings#x, null, null, 3]], [course#x, year#x, earnings#x, course#x, year#x, spark_grouping_id#xL]
+- Project [course#x, year#x, earnings#x, course#x AS course#x, year#x AS year#x]
+- SubqueryAlias coursesales
@@ -434,34 +434,32 @@ Project [course#x, year#x]
SELECT course, year, GROUPING(course), GROUPING(year) FROM courseSales GROUP BY CUBE(course, year)
ORDER BY GROUPING(course), GROUPING(year), course, year
-- !query analysis
-Project [course#x, year#x, grouping(course)#x, grouping(year)#x]
-+- Sort [cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) ASC NULLS FIRST, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) ASC NULLS FIRST, course#x ASC NULLS FIRST, year#x ASC NULLS FIRST], true
- +- Aggregate [course#x, year#x, spark_grouping_id#xL], [course#x, year#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(course)#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(year)#x, spark_grouping_id#xL, spark_grouping_id#xL]
- +- Expand [[course#x, year#x, earnings#x, course#x, year#x, 0], [course#x, year#x, earnings#x, course#x, null, 1], [course#x, year#x, earnings#x, null, year#x, 2], [course#x, year#x, earnings#x, null, null, 3]], [course#x, year#x, earnings#x, course#x, year#x, spark_grouping_id#xL]
- +- Project [course#x, year#x, earnings#x, course#x AS course#x, year#x AS year#x]
- +- SubqueryAlias coursesales
- +- View (`courseSales`, [course#x, year#x, earnings#x])
- +- Project [cast(course#x as string) AS course#x, cast(year#x as int) AS year#x, cast(earnings#x as int) AS earnings#x]
- +- Project [course#x, year#x, earnings#x]
- +- SubqueryAlias courseSales
- +- LocalRelation [course#x, year#x, earnings#x]
+Sort [grouping(course)#x ASC NULLS FIRST, grouping(year)#x ASC NULLS FIRST, course#x ASC NULLS FIRST, year#x ASC NULLS FIRST], true
++- Aggregate [course#x, year#x, spark_grouping_id#xL], [course#x, year#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(course)#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(year)#x]
+ +- Expand [[course#x, year#x, earnings#x, course#x, year#x, 0], [course#x, year#x, earnings#x, course#x, null, 1], [course#x, year#x, earnings#x, null, year#x, 2], [course#x, year#x, earnings#x, null, null, 3]], [course#x, year#x, earnings#x, course#x, year#x, spark_grouping_id#xL]
+ +- Project [course#x, year#x, earnings#x, course#x AS course#x, year#x AS year#x]
+ +- SubqueryAlias coursesales
+ +- View (`courseSales`, [course#x, year#x, earnings#x])
+ +- Project [cast(course#x as string) AS course#x, cast(year#x as int) AS year#x, cast(earnings#x as int) AS earnings#x]
+ +- Project [course#x, year#x, earnings#x]
+ +- SubqueryAlias courseSales
+ +- LocalRelation [course#x, year#x, earnings#x]
-- !query
SELECT course, year, GROUPING_ID(course, year) FROM courseSales GROUP BY CUBE(course, year)
ORDER BY GROUPING(course), GROUPING(year), course, year
-- !query analysis
-Project [course#x, year#x, grouping_id(course, year)#xL]
-+- Sort [cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) ASC NULLS FIRST, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) ASC NULLS FIRST, course#x ASC NULLS FIRST, year#x ASC NULLS FIRST], true
- +- Aggregate [course#x, year#x, spark_grouping_id#xL], [course#x, year#x, spark_grouping_id#xL AS grouping_id(course, year)#xL, spark_grouping_id#xL, spark_grouping_id#xL]
- +- Expand [[course#x, year#x, earnings#x, course#x, year#x, 0], [course#x, year#x, earnings#x, course#x, null, 1], [course#x, year#x, earnings#x, null, year#x, 2], [course#x, year#x, earnings#x, null, null, 3]], [course#x, year#x, earnings#x, course#x, year#x, spark_grouping_id#xL]
- +- Project [course#x, year#x, earnings#x, course#x AS course#x, year#x AS year#x]
- +- SubqueryAlias coursesales
- +- View (`courseSales`, [course#x, year#x, earnings#x])
- +- Project [cast(course#x as string) AS course#x, cast(year#x as int) AS year#x, cast(earnings#x as int) AS earnings#x]
- +- Project [course#x, year#x, earnings#x]
- +- SubqueryAlias courseSales
- +- LocalRelation [course#x, year#x, earnings#x]
+Sort [cast((shiftright(grouping_id(course, year)#xL, 1) & 1) as tinyint) ASC NULLS FIRST, cast((shiftright(grouping_id(course, year)#xL, 0) & 1) as tinyint) ASC NULLS FIRST, course#x ASC NULLS FIRST, year#x ASC NULLS FIRST], true
++- Aggregate [course#x, year#x, spark_grouping_id#xL], [course#x, year#x, spark_grouping_id#xL AS grouping_id(course, year)#xL]
+ +- Expand [[course#x, year#x, earnings#x, course#x, year#x, 0], [course#x, year#x, earnings#x, course#x, null, 1], [course#x, year#x, earnings#x, null, year#x, 2], [course#x, year#x, earnings#x, null, null, 3]], [course#x, year#x, earnings#x, course#x, year#x, spark_grouping_id#xL]
+ +- Project [course#x, year#x, earnings#x, course#x AS course#x, year#x AS year#x]
+ +- SubqueryAlias coursesales
+ +- View (`courseSales`, [course#x, year#x, earnings#x])
+ +- Project [cast(course#x as string) AS course#x, cast(year#x as int) AS year#x, cast(earnings#x as int) AS earnings#x]
+ +- Project [course#x, year#x, earnings#x]
+ +- SubqueryAlias courseSales
+ +- LocalRelation [course#x, year#x, earnings#x]
-- !query
@@ -630,7 +628,7 @@ Aggregate [a#x, b#x, spark_grouping_id#xL, _gen_grouping_pos#x], [a#x, b#x, coun
SELECT a, b, count(1) FROM testData GROUP BY a, CUBE(a, b), ROLLUP(a, b), GROUPING SETS((a, b), (a), ())
-- !query analysis
Aggregate [a#x, b#x, spark_grouping_id#xL, _gen_grouping_pos#x], [a#x, b#x, count(1) AS count(1)#xL]
-+- Expand [[a#x, b#x, a#x, b#x, 0, 0], [a#x, b#x, a#x, b#x, 0, 1], [a#x, b#x, a#x, b#x, 0, 2], [a#x, b#x, a#x, b#x, 0, 3], [a#x, b#x, a#x, b#x, 0, 4], [a#x, b#x, a#x, b#x, 0, 5], [a#x, b#x, a#x, b#x, 0, 6], [a#x, b#x, a#x, b#x, 0, 7], [a#x, b#x, a#x, b#x, 0, 8], [a#x, b#x, a#x, b#x, 0, 9], [a#x, b#x, a#x, b#x, 0, 10], [a#x, b#x, a#x, b#x, 0, 11], [a#x, b#x, a#x, b#x, 0, 12], [a#x, b#x, a#x, null, 1, 13], [a#x, b#x, a#x, null, 1, 14], [a#x, b#x, a#x, b#x, 0, 15], [a#x, b#x, a#x, null, 1, 16], [a#x, b#x, a#x, null, 1, 17], [a#x, b#x, a#x, b#x, 0, 18], [a#x, b#x, a#x, b#x, 0, 19], [a#x, b#x, a#x, b#x, 0, 20], [a#x, b#x, a#x, b#x, 0, 21], [a#x, b#x, a#x, b#x, 0, 22], [a#x, b#x, a#x, b#x, 0, 23], [a#x, b#x, a#x, b#x, 0, 24], ... 11 more fields], [a#x, b#x, a#x, b#x, spark_grouping_id#xL, _gen_grouping_pos#x]
++- Expand [[a#x, b#x, a#x, b#x, 0, 0], [a#x, b#x, a#x, b#x, 0, 1], [a#x, b#x, a#x, b#x, 0, 2], [a#x, b#x, a#x, b#x, 0, 3], [a#x, b#x, a#x, b#x, 0, 4], [a#x, b#x, a#x, b#x, 0, 5], [a#x, b#x, a#x, b#x, 0, 6], [a#x, b#x, a#x, b#x, 0, 7], [a#x, b#x, a#x, b#x, 0, 8], [a#x, b#x, a#x, b#x, 0, 9], [a#x, b#x, a#x, b#x, 0, 10], [a#x, b#x, a#x, b#x, 0, 11], [a#x, b#x, a#x, b#x, 0, 12], [a#x, b#x, a#x, null, 1, 13], [a#x, b#x, a#x, null, 1, 14], [a#x, b#x, a#x, b#x, 0, 15], [a#x, b#x, a#x, null, 1, 16], [a#x, b#x, a#x, null, 1, 17], [a#x, b#x, a#x, b#x, 0, 18], [a#x, b#x, a#x, b#x, 0, 19], [a#x, b#x, a#x, b#x, 0, 20], [a#x, b#x, a#x, b#x, 0, 21], [a#x, b#x, a#x, b#x, 0, 22], [a#x, b#x, a#x, b#x, 0, 23], [a#x, b#x, a#x, b#x, 0, 24], [a#x, b#x, a#x, b#x, 0, 25], [a#x, b#x, a#x, b#x, 0, 26], [a#x, b#x, a#x, b#x, 0, 27], [a#x, b#x, a#x, b#x, 0, 28], [a#x, b#x, a#x, b#x, 0, 29], [a#x, b#x, a#x, b#x, 0, 30], [a#x, b#x, a#x, null, 1, 31], [a#x, b#x, a#x, null, 1, 32], [a#x, b#x, a#x, b#x, 0, 33], [a#x, b#x, a#x, null, 1, 34], [a#x, b#x, a#x, null, 1, 35]], [a#x, b#x, a#x, b#x, spark_grouping_id#xL, _gen_grouping_pos#x]
+- Project [a#x, b#x, a#x AS a#x, b#x AS b#x]
+- SubqueryAlias testdata
+- View (`testData`, [a#x, b#x])
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/grouping_set.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/grouping_set.sql.out
index 254f9d0785408..2c63fb1525a46 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/grouping_set.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/grouping_set.sql.out
@@ -116,7 +116,7 @@ FROM (VALUES ('x', 'a', 10), ('y', 'b', 20) ) AS t (c1, c2, c3)
GROUP BY GROUPING SETS ( ( c1 ), ( c2 ) )
HAVING GROUPING__ID > 1
-- !query analysis
-Filter (grouping__id#xL > cast(1 as bigint))
+Filter (GROUPING__ID#xL > cast(1 as bigint))
+- Aggregate [c1#x, c2#x, spark_grouping_id#xL], [c1#x, c2#x, sum(c3#x) AS sum(c3)#xL, spark_grouping_id#xL AS grouping__id#xL]
+- Expand [[c1#x, c2#x, c3#x, c1#x, null, 1], [c1#x, c2#x, c3#x, null, c2#x, 2]], [c1#x, c2#x, c3#x, c1#x, c2#x, spark_grouping_id#xL]
+- Project [c1#x, c2#x, c3#x, c1#x AS c1#x, c2#x AS c2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/having-and-order-by-recursive-type-name-resolution.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/having-and-order-by-recursive-type-name-resolution.sql.out
new file mode 100644
index 0000000000000..7c843b6ef4757
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/having-and-order-by-recursive-type-name-resolution.sql.out
@@ -0,0 +1,313 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+SELECT 'a' AS col1 FROM VALUES (NAMED_STRUCT('a', 1)) t (col1) GROUP BY col1 ORDER BY col1.a
+-- !query analysis
+Project [col1#x]
++- Sort [col1#x.a ASC NULLS FIRST], true
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (NAMED_STRUCT('a', 1)) t (col1) GROUP BY col1 HAVING col1.a > 0
+-- !query analysis
+Project [col1#x]
++- Filter (col1#x.a > 0)
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (NAMED_STRUCT('a', 1)) t (col1) GROUP BY col1 HAVING col1.a > 0 ORDER BY col1.a
+-- !query analysis
+Project [col1#x]
++- Sort [col1#x.a ASC NULLS FIRST], true
+ +- Project [col1#x, col1#x]
+ +- Filter (col1#x.a > 0)
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', 1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 ORDER BY col1.a
+-- !query analysis
+Sort [col1#x.a ASC NULLS FIRST], true
++- Aggregate [col1#x], [named_struct(a, 1) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', 1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1.a > 0
+-- !query analysis
+Filter (col1#x.a > 0)
++- Aggregate [col1#x], [named_struct(a, 1) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', 1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1.a > 0 ORDER BY col1.a
+-- !query analysis
+Sort [col1#x.a ASC NULLS FIRST], true
++- Filter (col1#x.a > 0)
+ +- Aggregate [col1#x], [named_struct(a, 1) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', 1) AS col1 FROM VALUES (NAMED_STRUCT('a', 0)) t (col1) GROUP BY col1 ORDER BY col1.a
+-- !query analysis
+Sort [col1#x.a ASC NULLS FIRST], true
++- Aggregate [col1#x], [named_struct(a, 1) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', 1) AS col1 FROM VALUES (NAMED_STRUCT('a', 0)) t (col1) GROUP BY col1 HAVING col1.a > 0
+-- !query analysis
+Project [col1#x]
++- Filter (col1#x.a > 0)
+ +- Aggregate [col1#x], [named_struct(a, 1) AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', 1) AS col1 FROM VALUES (NAMED_STRUCT('a', 0)) t (col1) GROUP BY col1 HAVING col1.a > 0 ORDER BY col1.a
+-- !query analysis
+Sort [col1#x.a ASC NULLS FIRST], true
++- Project [col1#x]
+ +- Filter (col1#x.a > 0)
+ +- Aggregate [col1#x], [named_struct(a, 1) AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (ARRAY(1)) t (col1) GROUP BY col1 ORDER BY col1[0]
+-- !query analysis
+Project [col1#x]
++- Sort [col1#x[0] ASC NULLS FIRST], true
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (ARRAY(1)) t (col1) GROUP BY col1 HAVING col1[0] > 0
+-- !query analysis
+Project [col1#x]
++- Filter (col1#x[0] > 0)
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (ARRAY(1)) t (col1) GROUP BY col1 HAVING col1[0] > 0 ORDER BY col1[0]
+-- !query analysis
+Project [col1#x]
++- Sort [col1#x[0] ASC NULLS FIRST], true
+ +- Project [col1#x, col1#x]
+ +- Filter (col1#x[0] > 0)
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT ARRAY(1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 ORDER BY col1[0]
+-- !query analysis
+Sort [col1#x[0] ASC NULLS FIRST], true
++- Aggregate [col1#x], [array(1) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT ARRAY(1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1[0] > 0
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_EXTRACT_BASE_FIELD_TYPE",
+ "sqlState" : "42000",
+ "messageParameters" : {
+ "base" : "\"tempresolvedcolumn(col1)\"",
+ "other" : "\"STRING\""
+ }
+}
+
+
+-- !query
+SELECT NAMED_STRUCT('a', NAMED_STRUCT('b', 1)) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 ORDER BY col1.a.b
+-- !query analysis
+Sort [col1#x.a.b ASC NULLS FIRST], true
++- Aggregate [col1#x], [named_struct(a, named_struct(b, 1)) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', NAMED_STRUCT('b', 1)) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1.a.b > 0
+-- !query analysis
+Filter (col1#x.a.b > 0)
++- Aggregate [col1#x], [named_struct(a, named_struct(b, 1)) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT NAMED_STRUCT('a', NAMED_STRUCT('b', 1)) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1.a.b > 0 ORDER BY col1.a.b
+-- !query analysis
+Sort [col1#x.a.b ASC NULLS FIRST], true
++- Filter (col1#x.a.b > 0)
+ +- Aggregate [col1#x], [named_struct(a, named_struct(b, 1)) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT ARRAY(NAMED_STRUCT('a', 1)) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 ORDER BY col1[0].a
+-- !query analysis
+Sort [col1#x[0].a ASC NULLS FIRST], true
++- Aggregate [col1#x], [array(named_struct(a, 1)) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT ARRAY(NAMED_STRUCT('a', 1)) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1[0].a > 0
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_EXTRACT_BASE_FIELD_TYPE",
+ "sqlState" : "42000",
+ "messageParameters" : {
+ "base" : "\"tempresolvedcolumn(col1)\"",
+ "other" : "\"STRING\""
+ }
+}
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (MAP('key', 1)) t (col1) GROUP BY col1 ORDER BY col1['key']
+-- !query analysis
+Project [col1#x]
++- Sort [col1#x[key] ASC NULLS FIRST], true
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (MAP('key', 1)) t (col1) GROUP BY col1 HAVING col1['key'] > 0
+-- !query analysis
+Project [col1#x]
++- Filter (col1#x[key] > 0)
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'a' AS col1 FROM VALUES (MAP('key', 1)) t (col1) GROUP BY col1 HAVING col1['key'] > 0 ORDER BY col1['key']
+-- !query analysis
+Project [col1#x]
++- Sort [col1#x[key] ASC NULLS FIRST], true
+ +- Project [col1#x, col1#x]
+ +- Filter (col1#x[key] > 0)
+ +- Aggregate [col1#x], [a AS col1#x, col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT MAP('key', 1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 ORDER BY col1['key']
+-- !query analysis
+Sort [col1#x[key] ASC NULLS FIRST], true
++- Aggregate [col1#x], [map(key, 1) AS col1#x]
+ +- SubqueryAlias t
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT MAP('key', 1) AS col1 FROM VALUES ('a') t (col1) GROUP BY col1 HAVING col1['key'] > 0
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "INVALID_EXTRACT_BASE_FIELD_TYPE",
+ "sqlState" : "42000",
+ "messageParameters" : {
+ "base" : "\"tempresolvedcolumn(col1)\"",
+ "other" : "\"STRING\""
+ }
+}
+
+
+-- !query
+SELECT named_struct('a',1) as col, col1
+FROM values(named_struct('a',1))
+ORDER BY col1.a
+-- !query analysis
+Sort [col1#x.a ASC NULLS FIRST], true
++- Project [named_struct(a, 1) AS col#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT named_struct('a', 1) AS col1, col1
+FROM values(named_struct('a', 1))
+GROUP BY col1
+HAVING col1.a > 0
+-- !query analysis
+Filter (col1#x.a > 0)
++- Aggregate [col1#x], [named_struct(a, 1) AS col1#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT array(1, 2, 3) AS col1, col1
+FROM values(array(1, 2, 3))
+ORDER BY col1[0]
+-- !query analysis
+Sort [col1#x[0] ASC NULLS FIRST], true
++- Project [array(1, 2, 3) AS col1#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT array(1, 2, 3) AS col1, col1
+FROM values(array(1, 2, 3))
+GROUP BY col1
+HAVING col1[1] > 1
+-- !query analysis
+Filter (col1#x[1] > 1)
++- Aggregate [col1#x], [array(1, 2, 3) AS col1#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT map('a', 1, 'b', 2) AS col1, col1
+FROM values(map('a', 1, 'b', 2))
+ORDER BY col1['a']
+-- !query analysis
+Sort [col1#x[a] ASC NULLS FIRST], true
++- Project [map(a, 1, b, 2) AS col1#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT map('a', 1, 'b', 2) AS col1, col1
+FROM values(map('a', 1, 'b', 2))
+GROUP BY col1
+HAVING col1['b'] > 1
+-- !query analysis
+Filter (col1#x[b] > 1)
++- Aggregate [col1#x], [map(a, 1, b, 2) AS col1#x, col1#x]
+ +- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/having.sql.out
index 95329ac46390f..dab6b87e80737 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/having.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/having.sql.out
@@ -426,3 +426,83 @@ Project [((sum(v) + 1) + min(v))#xL]
+- Project [k#x, v#x]
+- SubqueryAlias hav
+- LocalRelation [k#x, v#x]
+
+
+-- !query
+SELECT col1 AS alias
+FROM values(1)
+GROUP BY col1
+HAVING (
+ SELECT col1 = 1
+)
+-- !query analysis
+Filter cast(scalar-subquery#x [alias#x] as boolean)
+: +- Project [(outer(alias#x) = 1) AS (outer(col1) = 1)#x]
+: +- OneRowRelation
++- Aggregate [col1#x], [col1#x AS alias#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS alias
+FROM values(named_struct('a', 1))
+GROUP BY col1
+HAVING (
+ SELECT col1.a = 1
+)
+-- !query analysis
+Filter cast(scalar-subquery#x [alias#x] as boolean)
+: +- Project [(outer(alias#x).a = 1) AS (outer(col1).a = 1)#x]
+: +- OneRowRelation
++- Aggregate [col1#x], [col1#x AS alias#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS alias
+FROM values(array(1))
+GROUP BY col1
+HAVING (
+ SELECT col1[0] = 1
+)
+-- !query analysis
+Filter cast(scalar-subquery#x [alias#x] as boolean)
+: +- Project [(outer(alias#x)[0] = 1) AS (outer(col1)[0] = 1)#x]
+: +- OneRowRelation
++- Aggregate [col1#x], [col1#x AS alias#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS alias
+FROM values(map('a', 1))
+GROUP BY col1
+HAVING (
+ SELECT col1[0] = 1
+)
+-- !query analysis
+Filter cast(scalar-subquery#x [alias#x] as boolean)
+: +- Project [(outer(alias#x)[cast(0 as string)] = 1) AS (outer(col1)[0] = 1)#x]
+: +- OneRowRelation
++- Aggregate [col1#x], [col1#x AS alias#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 FROM VALUES(1,2) GROUP BY col1, col2 HAVING col2 = col2
+-- !query analysis
+Project [col1#x]
++- Filter (col2#x = col2#x)
+ +- Aggregate [col1#x, col2#x], [col1#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col1 AS a, a AS b FROM VALUES(1,2) GROUP BY col1, col2 HAVING col2 = col2
+-- !query analysis
+Project [a#x, b#x]
++- Filter (col2#x = col2#x)
+ +- Project [a#x, a#x AS b#x, col2#x]
+ +- Project [col1#x, col2#x, col1#x AS a#x]
+ +- Aggregate [col1#x, col2#x], [col1#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/higher-order-functions.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/higher-order-functions.sql.out
index c06d1e5534aed..ab09f9ee47856 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/higher-order-functions.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/higher-order-functions.sql.out
@@ -370,3 +370,741 @@ select aggregate(split('abcdefgh',''), array(array('')), (acc, x) -> array(array
-- !query analysis
Project [aggregate(split(abcdefgh, , -1), array(array()), lambdafunction(array(array(lambda x#x)), lambda acc#x, lambda x#x, false), lambdafunction(lambda id#x, lambda id#x, false)) AS aggregate(split(abcdefgh, , -1), array(array()), lambdafunction(array(array(namedlambdavariable())), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))#x]
+- OneRowRelation
+
+
+-- !query
+select aggregate(array(1, 2, 3), 0, 100) as aggregate_int_literal
+-- !query analysis
+Project [aggregate(array(1, 2, 3), 0, lambdafunction(100, lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS aggregate_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select aggregate(array(1, 2, 3), map(), map('result', 999)) as aggregate_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"MAP\"",
+ "sqlExpr" : "\"aggregate(array(1, 2, 3), map(), lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 59,
+ "fragment" : "aggregate(array(1, 2, 3), map(), map('result', 999))"
+ } ]
+}
+
+
+-- !query
+select aggregate(array(1, 2, 3), struct('init', 0), struct('final', 999)) as aggregate_struct_literal
+-- !query analysis
+Project [aggregate(array(1, 2, 3), struct(col1, init, col2, 0), lambdafunction(struct(col1, final, col2, 999), lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS aggregate_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select aggregate(array(1, 2, 3), array(), array('result')) as aggregate_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(result), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"ARRAY\"",
+ "sqlExpr" : "\"aggregate(array(1, 2, 3), array(), lambdafunction(array(result), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 58,
+ "fragment" : "aggregate(array(1, 2, 3), array(), array('result'))"
+ } ]
+}
+
+
+-- !query
+select array_sort(array(3, 1, 2), 1) as array_sort_int_literal
+-- !query analysis
+Project [array_sort(array(3, 1, 2), lambdafunction(1, lambda col0#x, lambda col1#x, true), false) AS array_sort_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select array_sort(array(3, 1, 2), map('compare', 0)) as array_sort_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_RETURN_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "actualType" : "\"MAP\"",
+ "expectedType" : "\"INT\"",
+ "functionName" : "`lambdafunction`",
+ "sqlExpr" : "\"array_sort(array(3, 1, 2), lambdafunction(map(compare, 0), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 52,
+ "fragment" : "array_sort(array(3, 1, 2), map('compare', 0))"
+ } ]
+}
+
+
+-- !query
+select array_sort(array(3, 1, 2), struct('result', 0)) as array_sort_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_RETURN_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "actualType" : "\"STRUCT\"",
+ "expectedType" : "\"INT\"",
+ "functionName" : "`lambdafunction`",
+ "sqlExpr" : "\"array_sort(array(3, 1, 2), lambdafunction(struct(result, 0), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 54,
+ "fragment" : "array_sort(array(3, 1, 2), struct('result', 0))"
+ } ]
+}
+
+
+-- !query
+select array_sort(array(3, 1, 2), array(0)) as array_sort_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_RETURN_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "actualType" : "\"ARRAY\"",
+ "expectedType" : "\"INT\"",
+ "functionName" : "`lambdafunction`",
+ "sqlExpr" : "\"array_sort(array(3, 1, 2), lambdafunction(array(0), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 43,
+ "fragment" : "array_sort(array(3, 1, 2), array(0))"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), 1) as exists_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(1, namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 32,
+ "fragment" : "exists(array(1, 2, 3), 1)"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), map('found', true)) as exists_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(found, true), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(map(found, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 49,
+ "fragment" : "exists(array(1, 2, 3), map('found', true))"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), struct('exists', true)) as exists_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(exists, true), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(struct(exists, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 53,
+ "fragment" : "exists(array(1, 2, 3), struct('exists', true))"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), array(true)) as exists_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(array(true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 42,
+ "fragment" : "exists(array(1, 2, 3), array(true))"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), 1) as filter_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(1, namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 32,
+ "fragment" : "filter(array(1, 2, 3), 1)"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), map('key', 'value')) as filter_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(key, value), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(map(key, value), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "filter(array(1, 2, 3), map('key', 'value'))"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), struct('valid', true)) as filter_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(valid, true), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(struct(valid, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 52,
+ "fragment" : "filter(array(1, 2, 3), struct('valid', true))"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), array(true, false)) as filter_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true, false), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(array(true, false), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 49,
+ "fragment" : "filter(array(1, 2, 3), array(true, false))"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), 1) as forall_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(1, namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 32,
+ "fragment" : "forall(array(1, 2, 3), 1)"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), map('all', true)) as forall_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(all, true), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(map(all, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 47,
+ "fragment" : "forall(array(1, 2, 3), map('all', true))"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), struct('all', true)) as forall_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(all, true), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(struct(all, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "forall(array(1, 2, 3), struct('all', true))"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), array(true, true)) as forall_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true, true), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(array(true, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 48,
+ "fragment" : "forall(array(1, 2, 3), array(true, true))"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), 1) as map_filter_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(1, namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 41,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), 1)"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), map('keep', true)) as map_filter_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(keep, true), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(map(keep, true), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 57,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), map('keep', true))"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), struct('filter', true)) as map_filter_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(filter, true), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(struct(filter, true), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 62,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), struct('filter', true))"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), array(true)) as map_filter_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(array(true), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 51,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), array(true))"
+ } ]
+}
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), 100) as map_zipwith_int_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(100, lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), map('merged', true)) as map_zipwith_map_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(map(merged, true), lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), struct('left', 1, 'right', 10)) as map_zipwith_struct_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(struct(col1, left, col2, 1, col3, right, col4, 10), lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), array('combined')) as map_zipwith_array_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(array(combined), lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select reduce(array(1, 2, 3), 0, 100) as reduce_int_literal
+-- !query analysis
+Project [reduce(array(1, 2, 3), 0, lambdafunction(100, lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS reduce_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select reduce(array(1, 2, 3), map(), map('result', 999)) as reduce_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"MAP\"",
+ "sqlExpr" : "\"reduce(array(1, 2, 3), map(), lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 56,
+ "fragment" : "reduce(array(1, 2, 3), map(), map('result', 999))"
+ } ]
+}
+
+
+-- !query
+select reduce(array(1, 2, 3), struct('init', 0), struct('final', 999)) as reduce_struct_literal
+-- !query analysis
+Project [reduce(array(1, 2, 3), struct(col1, init, col2, 0), lambdafunction(struct(col1, final, col2, 999), lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS reduce_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select reduce(array(1, 2, 3), array(), array('result')) as reduce_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(result), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"ARRAY\"",
+ "sqlExpr" : "\"reduce(array(1, 2, 3), array(), lambdafunction(array(result), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 55,
+ "fragment" : "reduce(array(1, 2, 3), array(), array('result'))"
+ } ]
+}
+
+
+-- !query
+select transform(array(1, 2, 3), 42) as transform_int_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(42, lambda col0#x, true)) AS transform_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform(array(1, 2, 3), map('key', 'value')) as transform_map_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(map(key, value), lambda col0#x, true)) AS transform_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform(array(1, 2, 3), struct('id', 99, 'name', 'test')) as transform_struct_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(struct(col1, id, col2, 99, col3, name, col4, test), lambda col0#x, true)) AS transform_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform(array(1, 2, 3), array('a', 'b')) as transform_array_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(array(a, b), lambda col0#x, true)) AS transform_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), 42) as transform_keys_int_literal
+-- !query analysis
+Project [transform_keys(map(a, 1, b, 2), lambdafunction(42, lambda col0#x, lambda col1#x, true)) AS transform_keys_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), map('new', 'key')) as transform_keys_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.INVALID_MAP_KEY_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "keyType" : "\"MAP\"",
+ "sqlExpr" : "\"transform_keys(map(a, 1, b, 2), lambdafunction(map(new, key), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 61,
+ "fragment" : "transform_keys(map('a', 1, 'b', 2), map('new', 'key'))"
+ } ]
+}
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), struct('key', 'value')) as transform_keys_struct_literal
+-- !query analysis
+Project [transform_keys(map(a, 1, b, 2), lambdafunction(struct(col1, key, col2, value), lambda col0#x, lambda col1#x, true)) AS transform_keys_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), array('new_key')) as transform_keys_array_literal
+-- !query analysis
+Project [transform_keys(map(a, 1, b, 2), lambdafunction(array(new_key), lambda col0#x, lambda col1#x, true)) AS transform_keys_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), 999) as transform_values_int_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(999, lambda col0#x, lambda col1#x, true)) AS transform_values_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), map('new', 'value')) as transform_values_map_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(map(new, value), lambda col0#x, lambda col1#x, true)) AS transform_values_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), struct('val', 999)) as transform_values_struct_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(struct(col1, val, col2, 999), lambda col0#x, lambda col1#x, true)) AS transform_values_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), array('new_value')) as transform_values_array_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(array(new_value), lambda col0#x, lambda col1#x, true)) AS transform_values_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), 100) as zipwith_int_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(100, lambda col0#x, lambda col1#x, true)) AS zipwith_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), map('merged', true)) as zipwith_map_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(map(merged, true), lambda col0#x, lambda col1#x, true)) AS zipwith_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), struct('left', 1, 'right', 2)) as zipwith_struct_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(struct(col1, left, col2, 1, col3, right, col4, 2), lambda col0#x, lambda col1#x, true)) AS zipwith_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), array('combined')) as zipwith_array_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(array(combined), lambda col0#x, lambda col1#x, true)) AS zipwith_array_literal#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/identifier-clause.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/identifier-clause.sql.out
index deb2526e346b6..38b28f2d3b232 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/identifier-clause.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/identifier-clause.sql.out
@@ -84,7 +84,7 @@ SetNamespaceCommand [s]
INSERT INTO IDENTIFIER('ta' || 'b') VALUES(1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/s.db/tab, false, CSV, [path=file:[not included in comparison]/{warehouse_dir}/s.db/tab], Append, `spark_catalog`.`s`.`tab`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/s.db/tab), [c1]
-+- Project [cast(col1#x as int) AS c1#x]
++- Project [col1#x AS c1#x]
+- LocalRelation [col1#x]
@@ -308,7 +308,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`tab`, false
INSERT INTO tab VALUES (1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/tab, false, CSV, [path=file:[not included in comparison]/{warehouse_dir}/tab], Append, `spark_catalog`.`default`.`tab`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/tab), [c1]
-+- Project [cast(col1#x as int) AS c1#x]
++- Project [col1#x AS c1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/literals.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/literals.sql.out
index 9724fb01a1a81..39951f9ef3adc 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/literals.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/literals.sql.out
@@ -706,3 +706,51 @@ select -0, -0.0
-- !query analysis
Project [0 AS 0#x, 0.0 AS 0.0#x]
+- OneRowRelation
+
+
+-- !query
+SELECT "S""par""k" AS c1, "S\"par\"k" AS c2, 'S""par""k' AS c3
+-- !query analysis
+Project [S"par"k AS c1#x, S"par"k AS c2#x, S""par""k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT 'S''par''k' AS c1, 'S\'par\'k' AS c2, "S''par''k" AS c3
+-- !query analysis
+Project [S'par'k AS c1#x, S'par'k AS c2#x, S''par''k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT "S" "par" "k" AS c1, 'S' 'par' 'k' AS c2, "S" 'par' "k" AS c3, 'S' "par" 'k' AS c4, "S"'par'"k" AS c5, 'S'"par"'k' AS c6
+-- !query analysis
+Project [Spark AS c1#x, Spark AS c2#x, Spark AS c3#x, Spark AS c4#x, Spark AS c5#x, Spark AS c6#x]
++- OneRowRelation
+
+
+-- !query
+SET spark.sql.legacy.consecutiveStringLiterals.enabled=true
+-- !query analysis
+SetCommand (spark.sql.legacy.consecutiveStringLiterals.enabled,Some(true))
+
+
+-- !query
+SELECT "S""par""k" AS c1, "S\"par\"k" AS c2, 'S""par""k' AS c3
+-- !query analysis
+Project [Spark AS c1#x, S"par"k AS c2#x, S""par""k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT 'S''par''k' AS c1, 'S\'par\'k' AS c2, "S''par''k" AS c3
+-- !query analysis
+Project [Spark AS c1#x, S'par'k AS c2#x, S''par''k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT "S" "par" "k" AS c1, 'S' 'par' 'k' AS c2, "S" 'par' "k" AS c3, 'S' "par" 'k' AS c4, "S"'par'"k" AS c5, 'S'"par"'k' AS c6
+-- !query analysis
+Project [Spark AS c1#x, Spark AS c2#x, Spark AS c3#x, Spark AS c4#x, Spark AS c5#x, Spark AS c6#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/name-precedence-in-order-by-and-having-with-conflicting-attributes.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/name-precedence-in-order-by-and-having-with-conflicting-attributes.sql.out
new file mode 100644
index 0000000000000..6a0f6809dedc9
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/name-precedence-in-order-by-and-having-with-conflicting-attributes.sql.out
@@ -0,0 +1,675 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+CREATE OR REPLACE TEMPORARY VIEW v1 AS SELECT col1 FROM VALUES
+ (42), (17), (99), (5), (42),
+ (23), (8), (17), (76), (33),
+ (99), (55), (3), (42), (8)
+-- !query analysis
+CreateViewCommand `v1`, SELECT col1 FROM VALUES
+ (42), (17), (99), (5), (42),
+ (23), (8), (17), (76), (33),
+ (99), (55), (3), (42), (8), false, true, LocalTempView, UNSUPPORTED, true
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+CREATE OR REPLACE TEMPORARY VIEW v2 AS SELECT col1 FROM VALUES
+ ('apple'), ('banana'), ('cherry'), ('date'), ('apple'),
+ ('fig'), ('grape'), ('banana'), ('kiwi'), ('lemon'),
+ ('cherry'), ('mango'), ('orange'), ('apple'), ('grape')
+-- !query analysis
+CreateViewCommand `v2`, SELECT col1 FROM VALUES
+ ('apple'), ('banana'), ('cherry'), ('date'), ('apple'),
+ ('fig'), ('grape'), ('banana'), ('kiwi'), ('lemon'),
+ ('cherry'), ('mango'), ('orange'), ('apple'), ('grape'), false, true, LocalTempView, UNSUPPORTED, true
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 2 AS col1 FROM v1 ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 2 AS col1 FROM v1 GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [2], [2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 2 AS col1 FROM v1 GROUP BY ALL HAVING col1 > 50
+-- !query analysis
+Filter (col1#x > 50)
++- Aggregate [2], [2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 2 AS col1 FROM v1 ORDER BY col1
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [col1#x AS c#x, 2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 2 AS col1 FROM v1 GROUP BY ALL ORDER BY col1
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Sort [col1#x ASC NULLS FIRST], true
+ +- Aggregate [col1#x, 2], [col1#x AS c#x, 2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 2 AS col1 FROM v1 GROUP BY ALL HAVING col1 > 50
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Filter (c#x > 50)
+ +- Aggregate [col1#x, 2], [col1#x AS c#x, 2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 2 AS col1, 3 AS col1 FROM v1 ORDER BY col1
+-- !query analysis
+Project [col1#x, col1#x]
++- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [2 AS col1#x, 3 AS col1#x, col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 2 AS col1, 3 AS col1 FROM v1 GROUP BY ALL ORDER BY col1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNRESOLVED_COLUMN.WITH_SUGGESTION",
+ "sqlState" : "42703",
+ "messageParameters" : {
+ "objectName" : "`col1`",
+ "proposal" : "`col1`, `col1`"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 59,
+ "stopIndex" : 62,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT 2 AS col1, 3 AS col1 FROM v1 GROUP BY ALL HAVING col1 > 50
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 57,
+ "stopIndex" : 60,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT col1 AS c, 2 AS col1, 3 AS col1 FROM v1 ORDER BY col1
+-- !query analysis
+Project [c#x, col1#x, col1#x]
++- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [col1#x AS c#x, 2 AS col1#x, 3 AS col1#x, col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS c, 2 AS col1, 3 AS col1 FROM v1 GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Aggregate [col1#x, 2, 3], [col1#x AS c#x, 2 AS col1#x, 3 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 2 AS col1, 3 AS col1 FROM v1 GROUP BY ALL HAVING col1 > 50
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Filter (c#x > 50)
+ +- Aggregate [col1#x, 2, 3], [col1#x AS c#x, 2 AS col1#x, 3 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1, 2 AS col1 FROM v1 ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [col1#x, 2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1, 2 AS col1 FROM v1 GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [col1#x, 2], [col1#x, 2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1, 2 AS col1 FROM v1 GROUP BY ALL HAVING col1 > 50
+) ORDER BY 1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [col1#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Filter (col1#x > 50)
+ +- Aggregate [col1#x, 2], [col1#x, 2 AS col1#x]
+ +- SubqueryAlias v1
+ +- View (`v1`, [col1#x])
+ +- Project [cast(col1#x as int) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 3 AS col1 FROM (SELECT 1 AS col1, 2 AS col1) ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [3 AS col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Project [1 AS col1#x, 2 AS col1#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT 3 AS col1 FROM (SELECT 1 AS col1, 2 AS col1) GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [3], [3 AS col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Project [1 AS col1#x, 2 AS col1#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT 3 AS col1 FROM (SELECT 1 AS col1, 2 AS col1) GROUP BY ALL HAVING col1 > 50
+-- !query analysis
+Filter (col1#x > 50)
++- Aggregate [3], [3 AS col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Project [1 AS col1#x, 2 AS col1#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT col1 AS c, 3 AS col1 FROM (SELECT 1 AS col1, 2 AS col1) ORDER BY col1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 11,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT col1 AS c, 3 AS col1 FROM (SELECT 1 AS col1, 2 AS col1) GROUP BY ALL ORDER BY col1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 11,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT col1 AS c, 3 AS col1 FROM (SELECT 1 AS col1, 2 AS col1) GROUP BY ALL HAVING col1 > 50
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 11,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT 'col1' FROM v2 ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'col1' FROM v2 GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [col1], [col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'col1' FROM v2 GROUP BY ALL HAVING col1 > 'banana'
+-- !query analysis
+Filter (col1#x > banana)
++- Aggregate [col1], [col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 'col1' FROM v2 ORDER BY col1
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [col1#x AS c#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 'col1' FROM v2 GROUP BY ALL ORDER BY col1
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Sort [col1#x ASC NULLS FIRST], true
+ +- Aggregate [col1#x, col1], [col1#x AS c#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 'col1' FROM v2 GROUP BY ALL HAVING col1 > 'banana'
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Filter (c#x > banana)
+ +- Aggregate [col1#x, col1], [col1#x AS c#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'col1', 'col1' FROM v2 ORDER BY col1
+-- !query analysis
+Project [col1#x, col1#x]
++- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [col1 AS col1#x, col1 AS col1#x, col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'col1', 'col1' FROM v2 GROUP BY ALL ORDER BY col1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNRESOLVED_COLUMN.WITH_SUGGESTION",
+ "sqlState" : "42703",
+ "messageParameters" : {
+ "objectName" : "`col1`",
+ "proposal" : "`col1`, `col1`"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 53,
+ "stopIndex" : 56,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT 'col1', 'col1' FROM v2 GROUP BY ALL HAVING col1 > 'banana'
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 51,
+ "stopIndex" : 54,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT col1 AS c, 'col1', 'col1' FROM v2 ORDER BY col1
+-- !query analysis
+Project [c#x, col1#x, col1#x]
++- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [col1#x AS c#x, col1 AS col1#x, col1 AS col1#x, col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS c, 'col1', 'col1' FROM v2 GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Aggregate [col1#x, col1, col1], [col1#x AS c#x, col1 AS col1#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1 AS c, 'col1', 'col1' FROM v2 GROUP BY ALL HAVING col1 > 'banana'
+) ORDER BY 1
+-- !query analysis
+Sort [c#x ASC NULLS FIRST], true
++- Project [c#x, col1#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Filter (c#x > banana)
+ +- Aggregate [col1#x, col1, col1], [col1#x AS c#x, col1 AS col1#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1, 'col1' FROM v2 ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [col1#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1, 'col1' FROM v2 GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [col1#x, col1], [col1#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT * FROM (
+ SELECT col1, 'col1' FROM v2 GROUP BY ALL HAVING col1 > 'banana'
+) ORDER BY 1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [col1#x, col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Filter (col1#x > banana)
+ +- Aggregate [col1#x, col1], [col1#x, col1 AS col1#x]
+ +- SubqueryAlias v2
+ +- View (`v2`, [col1#x])
+ +- Project [cast(col1#x as string) AS col1#x]
+ +- Project [col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT 'col1' FROM (SELECT 'a' AS col1, 'b' AS col1) ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Project [col1 AS col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Project [a AS col1#x, b AS col1#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT 'col1' FROM (SELECT 'a' AS col1, 'b' AS col1) GROUP BY ALL ORDER BY col1
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [col1], [col1 AS col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Project [a AS col1#x, b AS col1#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT 'col1' FROM (SELECT 'a' AS col1, 'b' AS col1) GROUP BY ALL HAVING col1 > 'banana'
+-- !query analysis
+Filter (col1#x > banana)
++- Aggregate [col1], [col1 AS col1#x]
+ +- SubqueryAlias __auto_generated_subquery_name
+ +- Project [a AS col1#x, b AS col1#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT col1 AS c, 'col1' FROM (SELECT 'a' AS col1, 'b' AS col1) ORDER BY col1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 11,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT col1 AS c, 'col1' FROM (SELECT 'a' AS col1, 'b' AS col1) GROUP BY ALL ORDER BY col1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 11,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+SELECT col1 AS c, 'col1' FROM (SELECT 'a' AS col1, 'b' AS col1) GROUP BY ALL HAVING col1 > 'banana'
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "AMBIGUOUS_REFERENCE",
+ "sqlState" : "42704",
+ "messageParameters" : {
+ "name" : "`col1`",
+ "referenceNames" : "[`col1`, `col1`]"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 11,
+ "fragment" : "col1"
+ } ]
+}
+
+
+-- !query
+DROP VIEW v2
+-- !query analysis
+DropTempViewCommand v2
+
+
+-- !query
+DROP VIEW v1
+-- !query analysis
+DropTempViewCommand v1
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/cast.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/cast.sql.out
index e0687b564d3d1..0113716bdf712 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/cast.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/cast.sql.out
@@ -745,6 +745,97 @@ Project [cast(10.654321 as interval month) AS CAST(10.654321 AS INTERVAL MONTH)#
+- OneRowRelation
+-- !query
+SELECT CAST(TIME '00:01:52' AS tinyint)
+-- !query analysis
+Project [cast(00:01:52 as tinyint) AS CAST(TIME '00:01:52' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:01:52' AS smallint)
+-- !query analysis
+Project [cast(00:01:52 as smallint) AS CAST(TIME '00:01:52' AS SMALLINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:01:52' AS int)
+-- !query analysis
+Project [cast(00:01:52 as int) AS CAST(TIME '00:01:52' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:01:52' AS bigint)
+-- !query analysis
+Project [cast(00:01:52 as bigint) AS CAST(TIME '00:01:52' AS BIGINT)#xL]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS tinyint)
+-- !query analysis
+Project [cast(23:59:59 as tinyint) AS CAST(TIME '23:59:59' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS smallint)
+-- !query analysis
+Project [cast(23:59:59 as smallint) AS CAST(TIME '23:59:59' AS SMALLINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS int)
+-- !query analysis
+Project [cast(23:59:59 as int) AS CAST(TIME '23:59:59' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '23:59:59' AS bigint)
+-- !query analysis
+Project [cast(23:59:59 as bigint) AS CAST(TIME '23:59:59' AS BIGINT)#xL]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:17.5' AS tinyint)
+-- !query analysis
+Project [cast(00:00:17.5 as tinyint) AS CAST(TIME '00:00:17.5' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:17.5' AS int)
+-- !query analysis
+Project [cast(00:00:17.5 as int) AS CAST(TIME '00:00:17.5' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:17.9' AS int)
+-- !query analysis
+Project [cast(00:00:17.9 as int) AS CAST(TIME '00:00:17.9' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:00' AS tinyint)
+-- !query analysis
+Project [cast(00:00:00 as tinyint) AS CAST(TIME '00:00:00' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(TIME '00:00:00' AS int)
+-- !query analysis
+Project [cast(00:00:00 as int) AS CAST(TIME '00:00:00' AS INT)#x]
++- OneRowRelation
+
+
-- !query
SELECT '1.23' :: int
-- !query analysis
@@ -880,6 +971,34 @@ Project [cast(10.123456 as interval day to second) AS CAST(10.123456 AS INTERVAL
+- OneRowRelation
+-- !query
+SELECT TIME '00:01:52' :: tinyint
+-- !query analysis
+Project [cast(00:01:52 as tinyint) AS CAST(TIME '00:01:52' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT TIME '00:01:52' :: int
+-- !query analysis
+Project [cast(00:01:52 as int) AS CAST(TIME '00:01:52' AS INT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT TIME '23:59:59' :: tinyint
+-- !query analysis
+Project [cast(23:59:59 as tinyint) AS CAST(TIME '23:59:59' AS TINYINT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT TIME '23:59:59' :: int
+-- !query analysis
+Project [cast(23:59:59 as int) AS CAST(TIME '23:59:59' AS INT)#x]
++- OneRowRelation
+
+
-- !query
SELECT '1.23' :: int :: long
-- !query analysis
@@ -960,3 +1079,122 @@ org.apache.spark.sql.catalyst.parser.ParseException
"hint" : ""
}
}
+
+
+-- !query
+SELECT CAST(time '00:00:00' AS decimal(1, 0))
+-- !query analysis
+Project [cast(00:00:00 as decimal(1,0)) AS CAST(TIME '00:00:00' AS DECIMAL(1,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '12:00:00' AS decimal(7, 2))
+-- !query analysis
+Project [cast(12:00:00 as decimal(7,2)) AS CAST(TIME '12:00:00' AS DECIMAL(7,2))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '01:30:45' AS decimal(8, 3))
+-- !query analysis
+Project [cast(01:30:45 as decimal(8,3)) AS CAST(TIME '01:30:45' AS DECIMAL(8,3))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59' AS decimal(9, 4))
+-- !query analysis
+Project [cast(23:59:59 as decimal(9,4)) AS CAST(TIME '23:59:59' AS DECIMAL(9,4))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '01:02:03' AS decimal(15, 9))
+-- !query analysis
+Project [cast(01:02:03 as decimal(15,9)) AS CAST(TIME '01:02:03' AS DECIMAL(15,9))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '10:20:30' AS decimal(20, 10))
+-- !query analysis
+Project [cast(10:20:30 as decimal(20,10)) AS CAST(TIME '10:20:30' AS DECIMAL(20,10))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.001' AS decimal(8, 3))
+-- !query analysis
+Project [cast(23:59:59.001 as decimal(8,3)) AS CAST(TIME '23:59:59.001' AS DECIMAL(8,3))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999' AS decimal(11, 6))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(11,6)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(11,6))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999999' AS decimal(14, 9))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(14,9)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(14,9))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999999' AS decimal(20, 10))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(20,10)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(20,10))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '00:01:00' AS decimal(1, 0))
+-- !query analysis
+Project [cast(00:01:00 as decimal(1,0)) AS CAST(TIME '00:01:00' AS DECIMAL(1,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '01:00:00' AS decimal(3, 0))
+-- !query analysis
+Project [cast(01:00:00 as decimal(3,0)) AS CAST(TIME '01:00:00' AS DECIMAL(3,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '10:00:00' AS decimal(5, 2))
+-- !query analysis
+Project [cast(10:00:00 as decimal(5,2)) AS CAST(TIME '10:00:00' AS DECIMAL(5,2))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.9' AS decimal(6, 0))
+-- !query analysis
+Project [cast(23:59:59.9 as decimal(6,0)) AS CAST(TIME '23:59:59.9' AS DECIMAL(6,0))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999' AS decimal(8, 2))
+-- !query analysis
+Project [cast(23:59:59.999 as decimal(8,2)) AS CAST(TIME '23:59:59.999' AS DECIMAL(8,2))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999' AS decimal(11, 5))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(11,5)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(11,5))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT CAST(time '23:59:59.999999999' AS decimal(14, 8))
+-- !query analysis
+Project [cast(23:59:59.999999 as decimal(14,8)) AS CAST(TIME '23:59:59.999999' AS DECIMAL(14,8))#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/decimalArithmeticOperations.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/decimalArithmeticOperations.sql.out
index d75f4d41bd425..5c136f6fe1779 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/decimalArithmeticOperations.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/decimalArithmeticOperations.sql.out
@@ -51,7 +51,7 @@ insert into decimals_test values(1, 100.0, 999.0), (2, 12345.123, 12345.123),
(3, 0.1234567891011, 1234.1), (4, 123456789123456789.0, 1.123456789123456789)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/decimals_test, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/decimals_test], Append, `spark_catalog`.`default`.`decimals_test`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/decimals_test), [id, a, b]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,18)) AS a#x, cast(col3#x as decimal(38,18)) AS b#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,18)) AS a#x, cast(col3#x as decimal(38,18)) AS b#x]
+- LocalRelation [col1#x, col2#x, col3#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/double-quoted-identifiers.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/double-quoted-identifiers.sql.out
index a02bf525f947d..5c8b549a50658 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/double-quoted-identifiers.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/double-quoted-identifiers.sql.out
@@ -111,6 +111,20 @@ org.apache.spark.sql.catalyst.parser.ParseException
}
+-- !query
+select 1 from "not_""exists"
+-- !query analysis
+org.apache.spark.sql.catalyst.parser.ParseException
+{
+ "errorClass" : "PARSE_SYNTAX_ERROR",
+ "sqlState" : "42601",
+ "messageParameters" : {
+ "error" : "'\"not_\"\"exists\"'",
+ "hint" : ""
+ }
+}
+
+
-- !query
SELECT 1 FROM `hello`
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/higher-order-functions.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/higher-order-functions.sql.out
index 1281b19eb2f86..d4717b18bac5b 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/higher-order-functions.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/higher-order-functions.sql.out
@@ -370,3 +370,741 @@ select aggregate(split('abcdefgh',''), array(array('')), (acc, x) -> array(array
-- !query analysis
Project [aggregate(split(abcdefgh, , -1), array(array()), lambdafunction(array(array(lambda x#x)), lambda acc#x, lambda x#x, false), lambdafunction(lambda id#x, lambda id#x, false)) AS aggregate(split(abcdefgh, , -1), array(array()), lambdafunction(array(array(namedlambdavariable())), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))#x]
+- OneRowRelation
+
+
+-- !query
+select aggregate(array(1, 2, 3), 0, 100) as aggregate_int_literal
+-- !query analysis
+Project [aggregate(array(1, 2, 3), 0, lambdafunction(100, lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS aggregate_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select aggregate(array(1, 2, 3), map(), map('result', 999)) as aggregate_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"MAP\"",
+ "sqlExpr" : "\"aggregate(array(1, 2, 3), map(), lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 59,
+ "fragment" : "aggregate(array(1, 2, 3), map(), map('result', 999))"
+ } ]
+}
+
+
+-- !query
+select aggregate(array(1, 2, 3), struct('init', 0), struct('final', 999)) as aggregate_struct_literal
+-- !query analysis
+Project [aggregate(array(1, 2, 3), struct(col1, init, col2, 0), lambdafunction(struct(col1, final, col2, 999), lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS aggregate_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select aggregate(array(1, 2, 3), array(), array('result')) as aggregate_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(result), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"ARRAY\"",
+ "sqlExpr" : "\"aggregate(array(1, 2, 3), array(), lambdafunction(array(result), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 58,
+ "fragment" : "aggregate(array(1, 2, 3), array(), array('result'))"
+ } ]
+}
+
+
+-- !query
+select array_sort(array(3, 1, 2), 1) as array_sort_int_literal
+-- !query analysis
+Project [array_sort(array(3, 1, 2), lambdafunction(1, lambda col0#x, lambda col1#x, true), false) AS array_sort_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select array_sort(array(3, 1, 2), map('compare', 0)) as array_sort_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_RETURN_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "actualType" : "\"MAP\"",
+ "expectedType" : "\"INT\"",
+ "functionName" : "`lambdafunction`",
+ "sqlExpr" : "\"array_sort(array(3, 1, 2), lambdafunction(map(compare, 0), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 52,
+ "fragment" : "array_sort(array(3, 1, 2), map('compare', 0))"
+ } ]
+}
+
+
+-- !query
+select array_sort(array(3, 1, 2), struct('result', 0)) as array_sort_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_RETURN_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "actualType" : "\"STRUCT\"",
+ "expectedType" : "\"INT\"",
+ "functionName" : "`lambdafunction`",
+ "sqlExpr" : "\"array_sort(array(3, 1, 2), lambdafunction(struct(result, 0), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 54,
+ "fragment" : "array_sort(array(3, 1, 2), struct('result', 0))"
+ } ]
+}
+
+
+-- !query
+select array_sort(array(3, 1, 2), array(0)) as array_sort_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_RETURN_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "actualType" : "\"ARRAY\"",
+ "expectedType" : "\"INT\"",
+ "functionName" : "`lambdafunction`",
+ "sqlExpr" : "\"array_sort(array(3, 1, 2), lambdafunction(array(0), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 43,
+ "fragment" : "array_sort(array(3, 1, 2), array(0))"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), 1) as exists_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(1, namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 32,
+ "fragment" : "exists(array(1, 2, 3), 1)"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), map('found', true)) as exists_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(found, true), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(map(found, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 49,
+ "fragment" : "exists(array(1, 2, 3), map('found', true))"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), struct('exists', true)) as exists_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(exists, true), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(struct(exists, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 53,
+ "fragment" : "exists(array(1, 2, 3), struct('exists', true))"
+ } ]
+}
+
+
+-- !query
+select exists(array(1, 2, 3), array(true)) as exists_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"exists(array(1, 2, 3), lambdafunction(array(true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 42,
+ "fragment" : "exists(array(1, 2, 3), array(true))"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), 1) as filter_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(1, namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 32,
+ "fragment" : "filter(array(1, 2, 3), 1)"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), map('key', 'value')) as filter_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(key, value), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(map(key, value), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "filter(array(1, 2, 3), map('key', 'value'))"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), struct('valid', true)) as filter_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(valid, true), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(struct(valid, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 52,
+ "fragment" : "filter(array(1, 2, 3), struct('valid', true))"
+ } ]
+}
+
+
+-- !query
+select filter(array(1, 2, 3), array(true, false)) as filter_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true, false), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"filter(array(1, 2, 3), lambdafunction(array(true, false), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 49,
+ "fragment" : "filter(array(1, 2, 3), array(true, false))"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), 1) as forall_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(1, namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 32,
+ "fragment" : "forall(array(1, 2, 3), 1)"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), map('all', true)) as forall_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(all, true), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(map(all, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 47,
+ "fragment" : "forall(array(1, 2, 3), map('all', true))"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), struct('all', true)) as forall_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(all, true), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(struct(all, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "forall(array(1, 2, 3), struct('all', true))"
+ } ]
+}
+
+
+-- !query
+select forall(array(1, 2, 3), array(true, true)) as forall_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true, true), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"forall(array(1, 2, 3), lambdafunction(array(true, true), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 48,
+ "fragment" : "forall(array(1, 2, 3), array(true, true))"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), 1) as map_filter_int_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(1, namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"INT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(1, namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 41,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), 1)"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), map('keep', true)) as map_filter_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(keep, true), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(map(keep, true), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 57,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), map('keep', true))"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), struct('filter', true)) as map_filter_struct_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(struct(filter, true), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"STRUCT\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(struct(filter, true), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 62,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), struct('filter', true))"
+ } ]
+}
+
+
+-- !query
+select map_filter(map('a', 1, 'b', 2), array(true)) as map_filter_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(true), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"BOOLEAN\"",
+ "sqlExpr" : "\"map_filter(map(a, 1, b, 2), lambdafunction(array(true), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 51,
+ "fragment" : "map_filter(map('a', 1, 'b', 2), array(true))"
+ } ]
+}
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), 100) as map_zipwith_int_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(100, lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), map('merged', true)) as map_zipwith_map_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(map(merged, true), lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), struct('left', 1, 'right', 10)) as map_zipwith_struct_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(struct(col1, left, col2, 1, col3, right, col4, 10), lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select map_zip_with(map('a', 1), map('a', 10), array('combined')) as map_zipwith_array_literal
+-- !query analysis
+Project [map_zip_with(map(a, 1), map(a, 10), lambdafunction(array(combined), lambda col0#x, lambda col1#x, lambda col2#x, true)) AS map_zipwith_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select reduce(array(1, 2, 3), 0, 100) as reduce_int_literal
+-- !query analysis
+Project [reduce(array(1, 2, 3), 0, lambdafunction(100, lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS reduce_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select reduce(array(1, 2, 3), map(), map('result', 999)) as reduce_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"MAP\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"MAP\"",
+ "sqlExpr" : "\"reduce(array(1, 2, 3), map(), lambdafunction(map(result, 999), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 56,
+ "fragment" : "reduce(array(1, 2, 3), map(), map('result', 999))"
+ } ]
+}
+
+
+-- !query
+select reduce(array(1, 2, 3), struct('init', 0), struct('final', 999)) as reduce_struct_literal
+-- !query analysis
+Project [reduce(array(1, 2, 3), struct(col1, init, col2, 0), lambdafunction(struct(col1, final, col2, 999), lambda col0#x, lambda col1#x, true), lambdafunction(lambda id#x, lambda id#x, false)) AS reduce_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select reduce(array(1, 2, 3), array(), array('result')) as reduce_array_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"lambdafunction(array(result), namedlambdavariable(), namedlambdavariable())\"",
+ "inputType" : "\"ARRAY\"",
+ "paramIndex" : "third",
+ "requiredType" : "\"ARRAY\"",
+ "sqlExpr" : "\"reduce(array(1, 2, 3), array(), lambdafunction(array(result), namedlambdavariable(), namedlambdavariable()), lambdafunction(namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 55,
+ "fragment" : "reduce(array(1, 2, 3), array(), array('result'))"
+ } ]
+}
+
+
+-- !query
+select transform(array(1, 2, 3), 42) as transform_int_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(42, lambda col0#x, true)) AS transform_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform(array(1, 2, 3), map('key', 'value')) as transform_map_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(map(key, value), lambda col0#x, true)) AS transform_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform(array(1, 2, 3), struct('id', 99, 'name', 'test')) as transform_struct_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(struct(col1, id, col2, 99, col3, name, col4, test), lambda col0#x, true)) AS transform_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform(array(1, 2, 3), array('a', 'b')) as transform_array_literal
+-- !query analysis
+Project [transform(array(1, 2, 3), lambdafunction(array(a, b), lambda col0#x, true)) AS transform_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), 42) as transform_keys_int_literal
+-- !query analysis
+Project [transform_keys(map(a, 1, b, 2), lambdafunction(42, lambda col0#x, lambda col1#x, true)) AS transform_keys_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), map('new', 'key')) as transform_keys_map_literal
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.INVALID_MAP_KEY_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "keyType" : "\"MAP\"",
+ "sqlExpr" : "\"transform_keys(map(a, 1, b, 2), lambdafunction(map(new, key), namedlambdavariable(), namedlambdavariable()))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 61,
+ "fragment" : "transform_keys(map('a', 1, 'b', 2), map('new', 'key'))"
+ } ]
+}
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), struct('key', 'value')) as transform_keys_struct_literal
+-- !query analysis
+Project [transform_keys(map(a, 1, b, 2), lambdafunction(struct(col1, key, col2, value), lambda col0#x, lambda col1#x, true)) AS transform_keys_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_keys(map('a', 1, 'b', 2), array('new_key')) as transform_keys_array_literal
+-- !query analysis
+Project [transform_keys(map(a, 1, b, 2), lambdafunction(array(new_key), lambda col0#x, lambda col1#x, true)) AS transform_keys_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), 999) as transform_values_int_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(999, lambda col0#x, lambda col1#x, true)) AS transform_values_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), map('new', 'value')) as transform_values_map_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(map(new, value), lambda col0#x, lambda col1#x, true)) AS transform_values_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), struct('val', 999)) as transform_values_struct_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(struct(col1, val, col2, 999), lambda col0#x, lambda col1#x, true)) AS transform_values_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select transform_values(map('a', 1, 'b', 2), array('new_value')) as transform_values_array_literal
+-- !query analysis
+Project [transform_values(map(a, 1, b, 2), lambdafunction(array(new_value), lambda col0#x, lambda col1#x, true)) AS transform_values_array_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), 100) as zipwith_int_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(100, lambda col0#x, lambda col1#x, true)) AS zipwith_int_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), map('merged', true)) as zipwith_map_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(map(merged, true), lambda col0#x, lambda col1#x, true)) AS zipwith_map_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), struct('left', 1, 'right', 2)) as zipwith_struct_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(struct(col1, left, col2, 1, col3, right, col4, 2), lambda col0#x, lambda col1#x, true)) AS zipwith_struct_literal#x]
++- OneRowRelation
+
+
+-- !query
+select zip_with(array(1, 2, 3), array(4, 5, 6), array('combined')) as zipwith_array_literal
+-- !query analysis
+Project [zip_with(array(1, 2, 3), array(4, 5, 6), lambdafunction(array(combined), lambda col0#x, lambda col1#x, true)) AS zipwith_array_literal#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/literals.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/literals.sql.out
index 9724fb01a1a81..39951f9ef3adc 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/literals.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/literals.sql.out
@@ -706,3 +706,51 @@ select -0, -0.0
-- !query analysis
Project [0 AS 0#x, 0.0 AS 0.0#x]
+- OneRowRelation
+
+
+-- !query
+SELECT "S""par""k" AS c1, "S\"par\"k" AS c2, 'S""par""k' AS c3
+-- !query analysis
+Project [S"par"k AS c1#x, S"par"k AS c2#x, S""par""k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT 'S''par''k' AS c1, 'S\'par\'k' AS c2, "S''par''k" AS c3
+-- !query analysis
+Project [S'par'k AS c1#x, S'par'k AS c2#x, S''par''k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT "S" "par" "k" AS c1, 'S' 'par' 'k' AS c2, "S" 'par' "k" AS c3, 'S' "par" 'k' AS c4, "S"'par'"k" AS c5, 'S'"par"'k' AS c6
+-- !query analysis
+Project [Spark AS c1#x, Spark AS c2#x, Spark AS c3#x, Spark AS c4#x, Spark AS c5#x, Spark AS c6#x]
++- OneRowRelation
+
+
+-- !query
+SET spark.sql.legacy.consecutiveStringLiterals.enabled=true
+-- !query analysis
+SetCommand (spark.sql.legacy.consecutiveStringLiterals.enabled,Some(true))
+
+
+-- !query
+SELECT "S""par""k" AS c1, "S\"par\"k" AS c2, 'S""par""k' AS c3
+-- !query analysis
+Project [Spark AS c1#x, S"par"k AS c2#x, S""par""k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT 'S''par''k' AS c1, 'S\'par\'k' AS c2, "S''par''k" AS c3
+-- !query analysis
+Project [Spark AS c1#x, S'par'k AS c2#x, S''par''k AS c3#x]
++- OneRowRelation
+
+
+-- !query
+SELECT "S" "par" "k" AS c1, 'S' 'par' 'k' AS c2, "S" 'par' "k" AS c3, 'S' "par" 'k' AS c4, "S"'par'"k" AS c5, 'S'"par"'k' AS c6
+-- !query analysis
+Project [Spark AS c1#x, Spark AS c2#x, Spark AS c3#x, Spark AS c4#x, Spark AS c5#x, Spark AS c6#x]
++- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/string-functions.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/string-functions.sql.out
index ee4ad922fa8a5..b352d0edf896b 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/string-functions.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/string-functions.sql.out
@@ -128,6 +128,41 @@ Project [split(hello, , -1) AS split(hello, , -1)#x]
+- OneRowRelation
+-- !query
+SELECT split('hello', '', 0)
+-- !query analysis
+Project [split(hello, , 0) AS split(hello, , 0)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT split('hello', '', 1)
+-- !query analysis
+Project [split(hello, , 1) AS split(hello, , 1)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT split('hello', '', 3)
+-- !query analysis
+Project [split(hello, , 3) AS split(hello, , 3)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT split('hello', '', 5)
+-- !query analysis
+Project [split(hello, , 5) AS split(hello, , 5)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT split('hello', '', 100)
+-- !query analysis
+Project [split(hello, , 100) AS split(hello, , 100)#x]
++- OneRowRelation
+
+
-- !query
SELECT split('', '')
-- !query analysis
@@ -135,6 +170,27 @@ Project [split(, , -1) AS split(, , -1)#x]
+- OneRowRelation
+-- !query
+SELECT split('', '', -1)
+-- !query analysis
+Project [split(, , -1) AS split(, , -1)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT split('', '', 0)
+-- !query analysis
+Project [split(, , 0) AS split(, , 0)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT split('', '', 1)
+-- !query analysis
+Project [split(, , 1) AS split(, , 1)#x]
++- OneRowRelation
+
+
-- !query
SELECT split('abc', null)
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/timestamp.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/timestamp.sql.out
index dcfd783b648f8..963424bdaa09e 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/timestamp.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/nonansi/timestamp.sql.out
@@ -157,6 +157,235 @@ Project [make_timestamp(1, 1, 1, 1, 1, cast(999.999999 as decimal(16,6)), None,
+- OneRowRelation
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11))
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), None, None, Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678))
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), None, Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678))#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', TIME'00:00:00')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, TIME'00:00:00')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'MIT')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(MIT), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), MIT)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'PST')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(PST), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), PST)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'UTC')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(UTC), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), UTC)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'CET')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(CET), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), CET)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(make_date(2021, 07, 11), make_time(6, 30, 45.678), 'JST')
+-- !query analysis
+Project [make_timestamp(make_date(2021, 7, 11, false), Some(make_time(6, 30, cast(45.678 as decimal(16,6)))), Some(JST), Some(America/Los_Angeles)) AS make_timestamp(make_date(2021, 7, 11), make_time(6, 30, 45.678), JST)#x]
++- OneRowRelation
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', TIME'00:00:00', 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, TIME'00:00:00', 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', NULL, 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', TIME'00:00:00', NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, NULL, 'UTC')
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, TIME'00:00:00', NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', NULL, NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(NULL, NULL, NULL)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT make_timestamp(timestamp '2018-11-17 13:33:33', TIME'0:0:0', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"DATE\"",
+ "sqlExpr" : "\"make_timestamp(TIMESTAMP '2018-11-17 13:33:33', TIME '00:00:00', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 74,
+ "fragment" : "make_timestamp(timestamp '2018-11-17 13:33:33', TIME'0:0:0', 'CET')"
+ } ]
+}
+
+
+-- !query
+SELECT make_timestamp(timestamp_ntz '2018-11-17 13:33:33', TIME'0:0:0', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP_NTZ '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP_NTZ\"",
+ "paramIndex" : "first",
+ "requiredType" : "\"DATE\"",
+ "sqlExpr" : "\"make_timestamp(TIMESTAMP_NTZ '2018-11-17 13:33:33', TIME '00:00:00', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 78,
+ "fragment" : "make_timestamp(timestamp_ntz '2018-11-17 13:33:33', TIME'0:0:0', 'CET')"
+ } ]
+}
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', timestamp '2018-11-17 13:33:33', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"TIME\"",
+ "sqlExpr" : "\"make_timestamp(DATE '1970-01-01', TIMESTAMP '2018-11-17 13:33:33', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 79,
+ "fragment" : "make_timestamp(DATE'1970-01-01', timestamp '2018-11-17 13:33:33', 'CET')"
+ } ]
+}
+
+
+-- !query
+SELECT make_timestamp(DATE'1970-01-01', timestamp_ntz '2018-11-17 13:33:33', 'CET')
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "DATATYPE_MISMATCH.UNEXPECTED_INPUT_TYPE",
+ "sqlState" : "42K09",
+ "messageParameters" : {
+ "inputSql" : "\"TIMESTAMP_NTZ '2018-11-17 13:33:33'\"",
+ "inputType" : "\"TIMESTAMP_NTZ\"",
+ "paramIndex" : "second",
+ "requiredType" : "\"TIME\"",
+ "sqlExpr" : "\"make_timestamp(DATE '1970-01-01', TIMESTAMP_NTZ '2018-11-17 13:33:33', CET)\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 83,
+ "fragment" : "make_timestamp(DATE'1970-01-01', timestamp_ntz '2018-11-17 13:33:33', 'CET')"
+ } ]
+}
+
+
-- !query
select TIMESTAMP_SECONDS(1230219000),TIMESTAMP_SECONDS(-1230219000),TIMESTAMP_SECONDS(null)
-- !query analysis
@@ -711,45 +940,13 @@ org.apache.spark.sql.catalyst.ExtendedAnalysisException
-- !query
select timestamp'2011-11-11 11:11:11' + null
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.BINARY_OP_DIFF_TYPES",
- "sqlState" : "42K09",
- "messageParameters" : {
- "left" : "\"TIMESTAMP\"",
- "right" : "\"VOID\"",
- "sqlExpr" : "\"(TIMESTAMP '2011-11-11 11:11:11' + NULL)\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 44,
- "fragment" : "timestamp'2011-11-11 11:11:11' + null"
- } ]
-}
+[Analyzer test output redacted due to nondeterminism]
-- !query
select null + timestamp'2011-11-11 11:11:11'
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "DATATYPE_MISMATCH.BINARY_OP_DIFF_TYPES",
- "sqlState" : "42K09",
- "messageParameters" : {
- "left" : "\"VOID\"",
- "right" : "\"TIMESTAMP\"",
- "sqlExpr" : "\"(NULL + TIMESTAMP '2011-11-11 11:11:11')\""
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 8,
- "stopIndex" : 44,
- "fragment" : "null + timestamp'2011-11-11 11:11:11'"
- } ]
-}
+[Analyzer test output redacted due to nondeterminism]
-- !query
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/null-handling.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/null-handling.sql.out
index 37d84f6c5fc00..86ee26bd1cf62 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/null-handling.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/null-handling.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
insert into t1 values(1,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into t1 values(2,0,1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into t1 values(3,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into t1 values(4,1,1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into t1 values(5,null,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, cast(col2#x as int) AS b#x, col3#x AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -49,7 +49,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into t1 values(6,null,1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, cast(col2#x as int) AS b#x, col3#x AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -57,7 +57,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into t1 values(7,null,null)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [a, b, c]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
++- Project [col1#x AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x]
+- LocalRelation [col1#x, col2#x, col3#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/order-by-ordinal.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/order-by-ordinal.sql.out
index f1f189517dea7..842d099db396c 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/order-by-ordinal.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/order-by-ordinal.sql.out
@@ -150,6 +150,284 @@ Sort [a#x DESC NULLS LAST], false
+- LocalRelation [a#x, b#x]


+-- !query
+set spark.sql.prioritizeOrdinalResolutionInSort.enabled=true
+-- !query analysis
+SetCommand (spark.sql.prioritizeOrdinalResolutionInSort.enabled,Some(true))
+
+
+-- !query
+SELECT a FROM data ORDER BY 2, b
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 29,
+ "stopIndex" : 29,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY b, 2
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 32,
+ "stopIndex" : 32,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY 'b', 2
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 34,
+ "stopIndex" : 34,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY `b`, 2
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 34,
+ "stopIndex" : 34,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY a, 2
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 32,
+ "stopIndex" : 32,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY b, 3
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "3",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 32,
+ "stopIndex" : 32,
+ "fragment" : "3"
+ } ]
+}
+
+
+-- !query
+SELECT a, a + 1 FROM data ORDER BY b, 3
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "3",
+ "size" : "2"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 39,
+ "stopIndex" : 39,
+ "fragment" : "3"
+ } ]
+}
+
+
+-- !query
+set spark.sql.prioritizeOrdinalResolutionInSort.enabled=false
+-- !query analysis
+SetCommand (spark.sql.prioritizeOrdinalResolutionInSort.enabled,Some(false))
+
+
+-- !query
+SELECT a FROM data ORDER BY 2, b
+-- !query analysis
+Project [a#x]
++- Sort [b#x ASC NULLS FIRST, b#x ASC NULLS FIRST], true
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- View (`data`, [a#x, b#x])
+ +- Project [cast(a#x as int) AS a#x, cast(b#x as int) AS b#x]
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- LocalRelation [a#x, b#x]
+
+
+-- !query
+SELECT a FROM data ORDER BY b, 2
+-- !query analysis
+Project [a#x]
++- Sort [b#x ASC NULLS FIRST, b#x ASC NULLS FIRST], true
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- View (`data`, [a#x, b#x])
+ +- Project [cast(a#x as int) AS a#x, cast(b#x as int) AS b#x]
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- LocalRelation [a#x, b#x]
+
+
+-- !query
+SELECT a FROM data ORDER BY 'b', 2
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 34,
+ "stopIndex" : 34,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY `b`, 2
+-- !query analysis
+Project [a#x]
++- Sort [b#x ASC NULLS FIRST, b#x ASC NULLS FIRST], true
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- View (`data`, [a#x, b#x])
+ +- Project [cast(a#x as int) AS a#x, cast(b#x as int) AS b#x]
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- LocalRelation [a#x, b#x]
+
+
+-- !query
+SELECT a FROM data ORDER BY a, 2
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "2",
+ "size" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 32,
+ "stopIndex" : 32,
+ "fragment" : "2"
+ } ]
+}
+
+
+-- !query
+SELECT a FROM data ORDER BY b, 3
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "ORDER_BY_POS_OUT_OF_RANGE",
+ "sqlState" : "42805",
+ "messageParameters" : {
+ "index" : "3",
+ "size" : "2"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 32,
+ "stopIndex" : 32,
+ "fragment" : "3"
+ } ]
+}
+
+
+-- !query
+SELECT a, a + 1 FROM data ORDER BY b, 3
+-- !query analysis
+Project [a#x, (a + 1)#x]
++- Sort [b#x ASC NULLS FIRST, b#x ASC NULLS FIRST], true
+ +- Project [a#x, (a#x + 1) AS (a + 1)#x, b#x]
+ +- SubqueryAlias data
+ +- View (`data`, [a#x, b#x])
+ +- Project [cast(a#x as int) AS a#x, cast(b#x as int) AS b#x]
+ +- Project [a#x, b#x]
+ +- SubqueryAlias data
+ +- LocalRelation [a#x, b#x]
+
+
-- !query
set spark.sql.orderByOrdinal=false
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/order-by.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/order-by.sql.out
index 9c9305ac632db..920e16ea8687a 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/order-by.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/order-by.sql.out
@@ -454,6 +454,26 @@ Sort [(sum(b) + 1)#xL ASC NULLS FIRST], true
+- LocalRelation [a#x, b#x]


+-- !query
+SELECT col1 FROM VALUES(1,2) GROUP BY col1, col2 ORDER BY col2, col2
+-- !query analysis
+Project [col1#x]
++- Sort [col2#x ASC NULLS FIRST, col2#x ASC NULLS FIRST], true
+ +- Aggregate [col1#x, col2#x], [col1#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col1 AS a, a AS b FROM VALUES(1,2) GROUP BY col1, col2 ORDER BY col2, col2
+-- !query analysis
+Project [a#x, b#x]
++- Sort [col2#x ASC NULLS FIRST, col2#x ASC NULLS FIRST], true
+ +- Project [a#x, a#x AS b#x, col2#x]
+ +- Project [col1#x, col2#x, col1#x AS a#x]
+ +- Aggregate [col1#x, col2#x], [col1#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
-- !query
DROP VIEW IF EXISTS testData
-- !query analysis
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/pipe-operators.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/pipe-operators.sql.out
index 3de5ec38a2bad..dda0722e21d75 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/pipe-operators.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/pipe-operators.sql.out
@@ -16,7 +16,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`t`, false
insert into t values (0, 'abc'), (1, 'def')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t, false, CSV, [path=file:[not included in comparison]/{warehouse_dir}/t], Append, `spark_catalog`.`default`.`t`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t), [x, y]
-+- Project [cast(col1#x as int) AS x#x, cast(col2#x as string) AS y#x]
++- Project [col1#x AS x#x, col2#x AS y#x]
+- LocalRelation [col1#x, col2#x]
@@ -37,7 +37,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`other`, false
insert into other values (1, 1), (1, 2), (2, 4)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/other, false, JSON, [path=file:[not included in comparison]/{warehouse_dir}/other], Append, `spark_catalog`.`default`.`other`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/other), [a, b]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x]
++- Project [col1#x AS a#x, col2#x AS b#x]
+- LocalRelation [col1#x, col2#x]
@@ -58,7 +58,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`st`, false
insert into st values (1, (2, 3))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/st, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/st], Append, `spark_catalog`.`default`.`st`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/st), [x, col]
-+- Project [cast(col1#x as int) AS x#x, named_struct(i1, cast(col2#x.col1 as int), i2, cast(col2#x.col2 as int)) AS col#x]
++- Project [col1#x AS x#x, named_struct(i1, col2#x.col1, i2, col2#x.col2) AS col#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/boolean.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/boolean.sql.out
index 277ab866f97f7..9e5733212c24e 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/boolean.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/boolean.sql.out
@@ -290,7 +290,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`BOOLTBL1`, false
INSERT INTO BOOLTBL1 VALUES (cast('t' as boolean))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl1], Append, `spark_catalog`.`default`.`booltbl1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl1), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -298,7 +298,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL1 VALUES (cast('True' as boolean))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl1], Append, `spark_catalog`.`default`.`booltbl1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl1), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -306,7 +306,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL1 VALUES (cast('true' as boolean))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl1], Append, `spark_catalog`.`default`.`booltbl1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl1), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -355,7 +355,7 @@ Project [ AS zero#x, f1#x]
INSERT INTO BOOLTBL1 VALUES (boolean('f'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl1], Append, `spark_catalog`.`default`.`booltbl1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl1), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -380,7 +380,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`BOOLTBL2`, false
INSERT INTO BOOLTBL2 VALUES (boolean('f'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl2], Append, `spark_catalog`.`default`.`booltbl2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl2), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -388,7 +388,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL2 VALUES (boolean('false'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl2], Append, `spark_catalog`.`default`.`booltbl2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl2), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -396,7 +396,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL2 VALUES (boolean('False'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl2], Append, `spark_catalog`.`default`.`booltbl2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl2), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -404,7 +404,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL2 VALUES (boolean('FALSE'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl2], Append, `spark_catalog`.`default`.`booltbl2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl2), [f1]
-+- Project [cast(col1#x as boolean) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -593,7 +593,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`BOOLTBL3`, false
INSERT INTO BOOLTBL3 VALUES ('true', true, 1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl3], Append, `spark_catalog`.`default`.`booltbl3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl3), [d, b, o]
-+- Project [cast(col1#x as string) AS d#x, cast(col2#x as boolean) AS b#x, cast(col3#x as int) AS o#x]
++- Project [col1#x AS d#x, col2#x AS b#x, col3#x AS o#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -601,7 +601,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL3 VALUES ('false', false, 2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl3], Append, `spark_catalog`.`default`.`booltbl3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl3), [d, b, o]
-+- Project [cast(col1#x as string) AS d#x, cast(col2#x as boolean) AS b#x, cast(col3#x as int) AS o#x]
++- Project [col1#x AS d#x, col2#x AS b#x, col3#x AS o#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -609,7 +609,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO BOOLTBL3 VALUES ('null', null, 3)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl3], Append, `spark_catalog`.`default`.`booltbl3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl3), [d, b, o]
-+- Project [cast(col1#x as string) AS d#x, cast(col2#x as boolean) AS b#x, cast(col3#x as int) AS o#x]
++- Project [col1#x AS d#x, cast(col2#x as boolean) AS b#x, col3#x AS o#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -641,7 +641,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`booltbl4`, false
INSERT INTO booltbl4 VALUES (false, true, null)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/booltbl4, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/booltbl4], Append, `spark_catalog`.`default`.`booltbl4`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/booltbl4), [isfalse, istrue, isnul]
-+- Project [cast(col1#x as boolean) AS isfalse#x, cast(col2#x as boolean) AS istrue#x, cast(col3#x as boolean) AS isnul#x]
++- Project [col1#x AS isfalse#x, col2#x AS istrue#x, cast(col3#x as boolean) AS isnul#x]
+- LocalRelation [col1#x, col2#x, col3#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/case.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/case.sql.out
index 31d199e4754e0..465da4d2e737a 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/case.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/case.sql.out
@@ -21,7 +21,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`CASE2_TBL`, false
INSERT INTO CASE_TBL VALUES (1, 10.1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case_tbl], Append, `spark_catalog`.`default`.`case_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case_tbl), [i, f]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as double) AS f#x]
++- Project [col1#x AS i#x, cast(col2#x as double) AS f#x]
+- LocalRelation [col1#x, col2#x]
@@ -29,7 +29,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE_TBL VALUES (2, 20.2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case_tbl], Append, `spark_catalog`.`default`.`case_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case_tbl), [i, f]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as double) AS f#x]
++- Project [col1#x AS i#x, cast(col2#x as double) AS f#x]
+- LocalRelation [col1#x, col2#x]
@@ -37,7 +37,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE_TBL VALUES (3, -30.3)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case_tbl], Append, `spark_catalog`.`default`.`case_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case_tbl), [i, f]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as double) AS f#x]
++- Project [col1#x AS i#x, cast(col2#x as double) AS f#x]
+- LocalRelation [col1#x, col2#x]
@@ -45,7 +45,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE_TBL VALUES (4, NULL)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case_tbl], Append, `spark_catalog`.`default`.`case_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case_tbl), [i, f]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as double) AS f#x]
++- Project [col1#x AS i#x, cast(col2#x as double) AS f#x]
+- LocalRelation [col1#x, col2#x]
@@ -53,7 +53,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE2_TBL VALUES (1, -1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case2_tbl], Append, `spark_catalog`.`default`.`case2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case2_tbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [col1#x AS i#x, col2#x AS j#x]
+- LocalRelation [col1#x, col2#x]
@@ -61,7 +61,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE2_TBL VALUES (2, -2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case2_tbl], Append, `spark_catalog`.`default`.`case2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case2_tbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [col1#x AS i#x, col2#x AS j#x]
+- LocalRelation [col1#x, col2#x]
@@ -69,7 +69,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE2_TBL VALUES (3, -3)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case2_tbl], Append, `spark_catalog`.`default`.`case2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case2_tbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [col1#x AS i#x, col2#x AS j#x]
+- LocalRelation [col1#x, col2#x]
@@ -77,7 +77,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE2_TBL VALUES (2, -4)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case2_tbl], Append, `spark_catalog`.`default`.`case2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case2_tbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [col1#x AS i#x, col2#x AS j#x]
+- LocalRelation [col1#x, col2#x]
@@ -85,7 +85,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE2_TBL VALUES (1, NULL)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case2_tbl], Append, `spark_catalog`.`default`.`case2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case2_tbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [col1#x AS i#x, cast(col2#x as int) AS j#x]
+- LocalRelation [col1#x, col2#x]
@@ -93,7 +93,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO CASE2_TBL VALUES (NULL, -6)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/case2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/case2_tbl], Append, `spark_catalog`.`default`.`case2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/case2_tbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [cast(col1#x as int) AS i#x, col2#x AS j#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/create_view.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/create_view.sql.out
index e4e4be8fee7d3..e39f479f6ea65 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/create_view.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/create_view.sql.out
@@ -94,7 +94,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`viewtest_tbl`, false
INSERT INTO viewtest_tbl VALUES (5, 10), (10, 15), (15, 20), (20, 25)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/viewtest_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/viewtest_tbl], Append, `spark_catalog`.`default`.`viewtest_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/viewtest_tbl), [a, b]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x]
++- Project [col1#x AS a#x, col2#x AS b#x]
+- LocalRelation [col1#x, col2#x]
@@ -833,7 +833,7 @@ CreateDataSourceTableCommand `spark_catalog`.`testviewschm2`.`tmptbl`, false
INSERT INTO tmptbl VALUES (1, 1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/testviewschm2.db/tmptbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/testviewschm2.db/tmptbl], Append, `spark_catalog`.`testviewschm2`.`tmptbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/testviewschm2.db/tmptbl), [i, j]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x]
++- Project [col1#x AS i#x, col2#x AS j#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/date.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/date.sql.out
index d3ac6a3eb2b5c..16d1ffffd7d95 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/date.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/date.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`DATE_TBL`, false
INSERT INTO DATE_TBL VALUES (date('1957-04-09'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1957-06-13'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1996-02-28'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1996-02-29'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1996-03-01'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -49,7 +49,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1996-03-02'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -57,7 +57,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1997-02-28'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -65,7 +65,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1997-03-01'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -73,7 +73,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('1997-03-02'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -81,7 +81,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('2000-04-01'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -89,7 +89,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('2000-04-02'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -97,7 +97,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('2000-04-03'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -105,7 +105,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('2038-04-08'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -113,7 +113,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('2039-04-09'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -121,7 +121,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO DATE_TBL VALUES (date('2040-04-10'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/date_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/date_tbl], Append, `spark_catalog`.`default`.`date_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/date_tbl), [f1]
-+- Project [cast(col1#x as date) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float4.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float4.sql.out
index 0618a1d8432ed..445edd15f473f 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float4.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float4.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`FLOAT4_TBL`, false
INSERT INTO FLOAT4_TBL VALUES (float(' 0.0'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float4_tbl], Append, `spark_catalog`.`default`.`float4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float4_tbl), [f1]
-+- Project [cast(col1#x as float) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT4_TBL VALUES (float('1004.30 '))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float4_tbl], Append, `spark_catalog`.`default`.`float4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float4_tbl), [f1]
-+- Project [cast(col1#x as float) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT4_TBL VALUES (float(' -34.84 '))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float4_tbl], Append, `spark_catalog`.`default`.`float4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float4_tbl), [f1]
-+- Project [cast(col1#x as float) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT4_TBL VALUES (float('1.2345678901234e+20'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float4_tbl], Append, `spark_catalog`.`default`.`float4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float4_tbl), [f1]
-+- Project [cast(col1#x as float) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT4_TBL VALUES (float('1.2345678901234e-20'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float4_tbl], Append, `spark_catalog`.`default`.`float4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float4_tbl), [f1]
-+- Project [cast(col1#x as float) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float8.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float8.sql.out
index 2f2beda4f1cec..31f315d61bc9d 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float8.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/float8.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`FLOAT8_TBL`, false
INSERT INTO FLOAT8_TBL VALUES (double(' 0.0 '))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('1004.30 '))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double(' -34.84'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('1.2345678901234e+200'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('1.2345678901234e-200'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -612,7 +612,7 @@ TruncateTableCommand `spark_catalog`.`default`.`float8_tbl`
INSERT INTO FLOAT8_TBL VALUES (double('0.0'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -620,7 +620,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('-34.84'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -628,7 +628,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('-1004.30'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -636,7 +636,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('-1.2345678901234e+200'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -644,7 +644,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO FLOAT8_TBL VALUES (double('-1.2345678901234e-200'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/float8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/float8_tbl], Append, `spark_catalog`.`default`.`float8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/float8_tbl), [f1]
-+- Project [cast(col1#x as double) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/groupingsets.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/groupingsets.sql.out
index 82b03e986f9dd..84b280b5e9e73 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/groupingsets.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/groupingsets.sql.out
@@ -33,7 +33,7 @@ insert into gstest2 values
(2, 2, 2, 2, 2, 2, 2, 2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/gstest2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/gstest2], Append, `spark_catalog`.`default`.`gstest2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/gstest2), [a, b, c, d, e, f, g, h]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x, cast(col4#x as int) AS d#x, cast(col5#x as int) AS e#x, cast(col6#x as int) AS f#x, cast(col7#x as int) AS g#x, cast(col8#x as int) AS h#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x, col5#x AS e#x, col6#x AS f#x, col7#x AS g#x, col8#x AS h#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x, col5#x, col6#x, col7#x, col8#x]
@@ -49,7 +49,7 @@ insert into gstest3 values
(2, 2, 2, 2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/gstest3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/gstest3], Append, `spark_catalog`.`default`.`gstest3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/gstest3), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as int) AS c#x, cast(col4#x as int) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -68,7 +68,7 @@ values (1,1,tinyint('0'),1), (2,2,tinyint('1'),1),
(7,64,tinyint('2'),1), (8,128,tinyint('3'),1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/gstest4, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/gstest4], Append, `spark_catalog`.`default`.`gstest4`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/gstest4), [id, v, unhashable_col, unsortable_col]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS v#x, cast(col3#x as tinyint) AS unhashable_col#x, cast(col4#x as int) AS unsortable_col#x]
++- Project [col1#x AS id#x, col2#x AS v#x, col3#x AS unhashable_col#x, col4#x AS unsortable_col#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -401,13 +401,12 @@ group by grouping sets(ten) having grouping(ten) >= 0
order by 2,1
-- !query analysis
Sort [grouping(ten)#x ASC NULLS FIRST, ten#x ASC NULLS FIRST], true
-+- Project [ten#x, grouping(ten)#x]
- +- Filter (cast(cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) as int) >= 0)
- +- Aggregate [ten#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(ten)#x, spark_grouping_id#xL]
- +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, 0]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, spark_grouping_id#xL]
- +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x]
- +- SubqueryAlias spark_catalog.default.onek
- +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
++- Filter (cast(grouping(ten)#x as int) >= 0)
+ +- Aggregate [ten#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(ten)#x]
+ +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, 0]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, spark_grouping_id#xL]
+ +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x]
+ +- SubqueryAlias spark_catalog.default.onek
+ +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
-- !query
@@ -416,13 +415,12 @@ group by grouping sets(ten, four) having grouping(ten) > 0
order by 2,1
-- !query analysis
Sort [grouping(ten)#x ASC NULLS FIRST, ten#x ASC NULLS FIRST], true
-+- Project [ten#x, grouping(ten)#x]
- +- Filter (cast(cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) as int) > 0)
- +- Aggregate [ten#x, four#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(ten)#x, spark_grouping_id#xL]
- +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, null, 1], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, null, four#x, 2]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, four#x, spark_grouping_id#xL]
- +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x, four#x AS four#x]
- +- SubqueryAlias spark_catalog.default.onek
- +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
++- Filter (cast(grouping(ten)#x as int) > 0)
+ +- Aggregate [ten#x, four#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(ten)#x]
+ +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, null, 1], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, null, four#x, 2]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, four#x, spark_grouping_id#xL]
+ +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x, four#x AS four#x]
+ +- SubqueryAlias spark_catalog.default.onek
+ +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
-- !query
@@ -431,13 +429,12 @@ group by rollup(ten) having grouping(ten) > 0
order by 2,1
-- !query analysis
Sort [grouping(ten)#x ASC NULLS FIRST, ten#x ASC NULLS FIRST], true
-+- Project [ten#x, grouping(ten)#x]
- +- Filter (cast(cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) as int) > 0)
- +- Aggregate [ten#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(ten)#x, spark_grouping_id#xL]
- +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, 0], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, null, 1]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, spark_grouping_id#xL]
- +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x]
- +- SubqueryAlias spark_catalog.default.onek
- +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
++- Filter (cast(grouping(ten)#x as int) > 0)
+ +- Aggregate [ten#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(ten)#x]
+ +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, 0], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, null, 1]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, spark_grouping_id#xL]
+ +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x]
+ +- SubqueryAlias spark_catalog.default.onek
+ +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
-- !query
@@ -446,13 +443,12 @@ group by cube(ten) having grouping(ten) > 0
order by 2,1
-- !query analysis
Sort [grouping(ten)#x ASC NULLS FIRST, ten#x ASC NULLS FIRST], true
-+- Project [ten#x, grouping(ten)#x]
- +- Filter (cast(cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) as int) > 0)
- +- Aggregate [ten#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(ten)#x, spark_grouping_id#xL]
- +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, 0], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, null, 1]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, spark_grouping_id#xL]
- +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x]
- +- SubqueryAlias spark_catalog.default.onek
- +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
++- Filter (cast(grouping(ten)#x as int) > 0)
+ +- Aggregate [ten#x, spark_grouping_id#xL], [ten#x, cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) AS grouping(ten)#x]
+ +- Expand [[unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, 0], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, null, 1]], [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x, spark_grouping_id#xL]
+ +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, ten#x AS ten#x]
+ +- SubqueryAlias spark_catalog.default.onek
+ +- Relation spark_catalog.default.onek[unique1#x,unique2#x,two#x,four#x,ten#x,twenty#x,hundred#x,thousand#x,twothousand#x,fivethous#x,tenthous#x,odd#x,even#x,stringu1#x,stringu2#x,string4#x] parquet
-- !query
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int2.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int2.sql.out
index 9dda3c0dc42d4..6720132a09acc 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int2.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int2.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`INT2_TBL`, false
INSERT INTO INT2_TBL VALUES (smallint(trim('0 ')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int2_tbl], Append, `spark_catalog`.`default`.`int2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int2_tbl), [f1]
-+- Project [cast(col1#x as smallint) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT2_TBL VALUES (smallint(trim(' 1234 ')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int2_tbl], Append, `spark_catalog`.`default`.`int2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int2_tbl), [f1]
-+- Project [cast(col1#x as smallint) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT2_TBL VALUES (smallint(trim(' -1234')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int2_tbl], Append, `spark_catalog`.`default`.`int2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int2_tbl), [f1]
-+- Project [cast(col1#x as smallint) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT2_TBL VALUES (smallint('32767'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int2_tbl], Append, `spark_catalog`.`default`.`int2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int2_tbl), [f1]
-+- Project [cast(col1#x as smallint) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT2_TBL VALUES (smallint('-32767'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int2_tbl], Append, `spark_catalog`.`default`.`int2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int2_tbl), [f1]
-+- Project [cast(col1#x as smallint) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int4.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int4.sql.out
index d261b59a4c5e2..e19adeb5f0bf7 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int4.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int4.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`INT4_TBL`, false
INSERT INTO INT4_TBL VALUES (int(trim(' 0 ')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int4_tbl], Append, `spark_catalog`.`default`.`int4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int4_tbl), [f1]
-+- Project [cast(col1#x as int) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT4_TBL VALUES (int(trim('123456 ')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int4_tbl], Append, `spark_catalog`.`default`.`int4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int4_tbl), [f1]
-+- Project [cast(col1#x as int) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT4_TBL VALUES (int(trim(' -123456')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int4_tbl], Append, `spark_catalog`.`default`.`int4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int4_tbl), [f1]
-+- Project [cast(col1#x as int) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT4_TBL VALUES (int('2147483647'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int4_tbl], Append, `spark_catalog`.`default`.`int4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int4_tbl), [f1]
-+- Project [cast(col1#x as int) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT4_TBL VALUES (int('-2147483647'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int4_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int4_tbl], Append, `spark_catalog`.`default`.`int4_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int4_tbl), [f1]
-+- Project [cast(col1#x as int) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int8.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int8.sql.out
index 72972469fa6ef..9546f1dae5e31 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int8.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/int8.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`INT8_TBL`, false
INSERT INTO INT8_TBL VALUES(bigint(trim(' 123 ')),bigint(trim(' 456')))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int8_tbl], Append, `spark_catalog`.`default`.`int8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int8_tbl), [q1, q2]
-+- Project [cast(col1#xL as bigint) AS q1#xL, cast(col2#xL as bigint) AS q2#xL]
++- Project [col1#xL AS q1#xL, col2#xL AS q2#xL]
+- LocalRelation [col1#xL, col2#xL]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT8_TBL VALUES(bigint(trim('123 ')),bigint('4567890123456789'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int8_tbl], Append, `spark_catalog`.`default`.`int8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int8_tbl), [q1, q2]
-+- Project [cast(col1#xL as bigint) AS q1#xL, cast(col2#xL as bigint) AS q2#xL]
++- Project [col1#xL AS q1#xL, col2#xL AS q2#xL]
+- LocalRelation [col1#xL, col2#xL]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT8_TBL VALUES(bigint('4567890123456789'),bigint('123'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int8_tbl], Append, `spark_catalog`.`default`.`int8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int8_tbl), [q1, q2]
-+- Project [cast(col1#xL as bigint) AS q1#xL, cast(col2#xL as bigint) AS q2#xL]
++- Project [col1#xL AS q1#xL, col2#xL AS q2#xL]
+- LocalRelation [col1#xL, col2#xL]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT8_TBL VALUES(+4567890123456789,bigint('4567890123456789'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int8_tbl], Append, `spark_catalog`.`default`.`int8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int8_tbl), [q1, q2]
-+- Project [cast(col1#xL as bigint) AS q1#xL, cast(col2#xL as bigint) AS q2#xL]
++- Project [col1#xL AS q1#xL, col2#xL AS q2#xL]
+- LocalRelation [col1#xL, col2#xL]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO INT8_TBL VALUES(bigint('+4567890123456789'),bigint('-4567890123456789'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/int8_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/int8_tbl], Append, `spark_catalog`.`default`.`int8_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/int8_tbl), [q1, q2]
-+- Project [cast(col1#xL as bigint) AS q1#xL, cast(col2#xL as bigint) AS q2#xL]
++- Project [col1#xL AS q1#xL, col2#xL AS q2#xL]
+- LocalRelation [col1#xL, col2#xL]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/join.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/join.sql.out
index 144fb69812ee6..439094c112863 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/join.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/join.sql.out
@@ -116,7 +116,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`J2_TBL`, false
INSERT INTO J1_TBL VALUES (1, 4, 'one')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -124,7 +124,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (2, 3, 'two')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -132,7 +132,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (3, 2, 'three')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -140,7 +140,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (4, 1, 'four')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -148,7 +148,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (5, 0, 'five')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -156,7 +156,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (6, 6, 'six')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -164,7 +164,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (7, 7, 'seven')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -172,7 +172,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (8, 8, 'eight')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -180,7 +180,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (0, NULL, 'zero')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [col1#x AS i#x, cast(col2#x as int) AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -188,7 +188,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (NULL, NULL, 'null')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -196,7 +196,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J1_TBL VALUES (NULL, 0, 'zero')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1_tbl], Append, `spark_catalog`.`default`.`j1_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1_tbl), [i, j, t]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS j#x, cast(col3#x as string) AS t#x]
++- Project [cast(col1#x as int) AS i#x, col2#x AS j#x, col3#x AS t#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -204,7 +204,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (1, -1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -212,7 +212,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (2, 2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -220,7 +220,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (3, -3)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -228,7 +228,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (2, 4)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -236,7 +236,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (5, -5)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -244,7 +244,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (5, -5)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -252,7 +252,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (0, NULL)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [col1#x AS i#x, cast(col2#x as int) AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -268,7 +268,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO J2_TBL VALUES (NULL, 0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2_tbl], Append, `spark_catalog`.`default`.`j2_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2_tbl), [i, k]
-+- Project [cast(col1#x as int) AS i#x, cast(col2#x as int) AS k#x]
++- Project [cast(col1#x as int) AS i#x, col2#x AS k#x]
+- LocalRelation [col1#x, col2#x]
@@ -674,7 +674,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`t3`, false
INSERT INTO t1 VALUES ( 'bb', 11 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -682,7 +682,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO t2 VALUES ( 'bb', 12 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -690,7 +690,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO t2 VALUES ( 'cc', 22 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -698,7 +698,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO t2 VALUES ( 'ee', 42 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t2], Append, `spark_catalog`.`default`.`t2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t2), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -706,7 +706,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO t3 VALUES ( 'bb', 13 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -714,7 +714,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO t3 VALUES ( 'cc', 23 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -722,7 +722,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO t3 VALUES ( 'dd', 33 )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t3, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t3], Append, `spark_catalog`.`default`.`t3`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t3), [name, n]
-+- Project [cast(col1#x as string) AS name#x, cast(col2#x as int) AS n#x]
++- Project [col1#x AS name#x, col2#x AS n#x]
+- LocalRelation [col1#x, col2#x]
@@ -1326,7 +1326,7 @@ Aggregate [count(1) AS count(1)#xL]
+- Filter unique1#x IN (list#x [])
: +- Project [unique1#x]
: +- Filter (unique2#x = 42)
- : +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, ... 6 more fields]
+ : +- Project [unique1#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x, unique2#x, two#x, four#x, ten#x, twenty#x, hundred#x, thousand#x, twothousand#x, fivethous#x, tenthous#x, odd#x, even#x, stringu1#x, stringu2#x, string4#x]
: +- Join Inner, (unique1#x = unique1#x)
: :- SubqueryAlias b
: : +- SubqueryAlias spark_catalog.default.tenk1
@@ -3844,7 +3844,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`j2`, false
INSERT INTO j1 values(1,1),(1,2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j1], Append, `spark_catalog`.`default`.`j1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j1), [id1, id2]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x]
+- LocalRelation [col1#x, col2#x]
@@ -3852,7 +3852,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO j2 values(1,1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2], Append, `spark_catalog`.`default`.`j2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2), [id1, id2]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x]
+- LocalRelation [col1#x, col2#x]
@@ -3860,7 +3860,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO j2 values(1,2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/j2, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/j2], Append, `spark_catalog`.`default`.`j2`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/j2), [id1, id2]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/numeric.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/numeric.sql.out
index 6c2ae23291755..d5e8edbf02060 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/numeric.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/numeric.sql.out
@@ -63,7 +63,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`num_result`, false
INSERT INTO num_exp_add VALUES (0,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -71,7 +71,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -79,7 +79,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -87,7 +87,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -95,7 +95,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -103,7 +103,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -111,7 +111,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -119,7 +119,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -127,7 +127,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,2,-34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -135,7 +135,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,2,34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -143,7 +143,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,2,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -151,7 +151,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,2,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -159,7 +159,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,3,4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -167,7 +167,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,3,-4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -175,7 +175,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,3,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -183,7 +183,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,3,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -191,7 +191,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,4,7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -199,7 +199,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,4,-7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -207,7 +207,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,4,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -215,7 +215,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,4,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -223,7 +223,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,5,16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -231,7 +231,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,5,-16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -239,7 +239,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,5,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -247,7 +247,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,5,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -255,7 +255,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,6,93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -263,7 +263,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,6,-93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -271,7 +271,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,6,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -279,7 +279,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,6,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -287,7 +287,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,7,-83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -295,7 +295,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,7,83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -303,7 +303,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,7,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -311,7 +311,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,7,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -319,7 +319,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,8,74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -327,7 +327,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,8,-74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -335,7 +335,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,8,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -343,7 +343,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,8,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -351,7 +351,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (0,9,-24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -359,7 +359,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (0,9,24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -367,7 +367,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (0,9,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -375,7 +375,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (0,9,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -383,7 +383,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -391,7 +391,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -399,7 +399,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -407,7 +407,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -415,7 +415,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -423,7 +423,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -431,7 +431,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -439,7 +439,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -447,7 +447,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,2,-34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -455,7 +455,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,2,34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -463,7 +463,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,2,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -471,7 +471,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,2,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -479,7 +479,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,3,4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -487,7 +487,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,3,-4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -495,7 +495,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,3,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -503,7 +503,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,3,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -511,7 +511,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,4,7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -519,7 +519,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,4,-7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -527,7 +527,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,4,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -535,7 +535,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,4,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -543,7 +543,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,5,16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -551,7 +551,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,5,-16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -559,7 +559,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,5,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -567,7 +567,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,5,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -575,7 +575,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,6,93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -583,7 +583,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,6,-93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -591,7 +591,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,6,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -599,7 +599,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,6,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -607,7 +607,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,7,-83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -615,7 +615,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,7,83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -623,7 +623,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,7,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -631,7 +631,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,7,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -639,7 +639,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,8,74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -647,7 +647,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,8,-74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -655,7 +655,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,8,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -663,7 +663,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,8,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -671,7 +671,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (1,9,-24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -679,7 +679,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (1,9,24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -687,7 +687,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (1,9,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -695,7 +695,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (1,9,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -703,7 +703,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,0,-34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -711,7 +711,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,0,-34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -719,7 +719,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -727,7 +727,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -735,7 +735,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,1,-34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -743,7 +743,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,1,-34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -751,7 +751,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -759,7 +759,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -767,7 +767,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,2,-68676984.430794094)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -775,7 +775,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,2,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -783,7 +783,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,2,1179132047626883.596862135856320209)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -791,7 +791,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,2,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -799,7 +799,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,3,-34338487.905397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -807,7 +807,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,3,-34338496.525397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -815,7 +815,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,3,-147998901.44836127257)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -823,7 +823,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,3,-7967167.56737750510440835266)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -831,7 +831,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,4,-26539030.803497047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -839,7 +839,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,4,-42137953.627297047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -847,7 +847,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,4,-267821744976817.8111137106593)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -855,7 +855,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,4,-4.40267480046830116685)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -863,7 +863,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,5,-34322095.176906047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -871,7 +871,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,5,-34354889.253888047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -879,7 +879,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,5,-563049578578.769242506736077)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -887,7 +887,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,5,-2094.18866914563535496429)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -895,7 +895,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,6,-34244590.637766787)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -903,7 +903,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,6,-34432393.793027307)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -911,7 +911,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,6,-3224438592470.18449811926184222)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -919,7 +919,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,6,-365.68599891479766440940)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -927,7 +927,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,7,-117366977.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -935,7 +935,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,7,48689992.784602953)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -943,7 +943,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,7,2851072985828710.485883795)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -951,7 +951,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,7,.41357483778485235518)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -959,7 +959,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,8,-34263611.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -967,7 +967,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,8,-34413373.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -975,7 +975,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,8,-2571300635581.146276407)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -983,7 +983,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,8,-458.57416721727870888476)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -991,7 +991,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (2,9,-59265296.260444467)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -999,7 +999,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (2,9,-9411688.170349627)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1007,7 +1007,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (2,9,855948866655588.453741509242968740)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1015,7 +1015,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (2,9,1.37757299946438931811)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1023,7 +1023,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,0,4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1031,7 +1031,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,0,4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1039,7 +1039,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1047,7 +1047,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1055,7 +1055,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,1,4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1063,7 +1063,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,1,4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1071,7 +1071,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1079,7 +1079,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1087,7 +1087,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,2,-34338487.905397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1095,7 +1095,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,2,34338496.525397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1103,7 +1103,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,2,-147998901.44836127257)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1111,7 +1111,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,2,-.00000012551512084352)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1119,7 +1119,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,3,8.62)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1127,7 +1127,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,3,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1135,7 +1135,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,3,18.5761)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1143,7 +1143,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,3,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1151,7 +1151,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,4,7799465.7219)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1159,7 +1159,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,4,-7799457.1019)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1167,7 +1167,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,4,33615678.685289)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1175,7 +1175,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,4,.00000055260225961552)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1183,7 +1183,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,5,16401.348491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1191,7 +1191,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,5,-16392.728491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1199,7 +1199,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,5,70671.23589621)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1207,7 +1207,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,5,.00026285234387695504)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1215,7 +1215,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,6,93905.88763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1223,7 +1223,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,6,-93897.26763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1231,7 +1231,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,6,404715.7995864206)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1239,7 +1239,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,6,.00004589912234457595)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1247,7 +1247,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,7,-83028480.69)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1255,7 +1255,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,7,83028489.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1263,7 +1263,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,7,-357852770.35)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1271,7 +1271,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,7,-.00000005190989574240)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1279,7 +1279,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,8,74885.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1287,7 +1287,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,8,-74876.69)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1295,7 +1295,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,8,322737.11)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1303,7 +1303,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,8,.00005755799201399553)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1311,7 +1311,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (3,9,-24926799.735047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1319,7 +1319,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (3,9,24926808.355047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1327,7 +1327,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (3,9,-107434525.43415438020)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1335,7 +1335,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (3,9,-.00000017290624149854)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1343,7 +1343,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,0,7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1351,7 +1351,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,0,7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1359,7 +1359,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1367,7 +1367,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1375,7 +1375,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,1,7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1383,7 +1383,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,1,7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1391,7 +1391,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1399,7 +1399,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1407,7 +1407,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,2,-26539030.803497047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1415,7 +1415,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,2,42137953.627297047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1423,7 +1423,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,2,-267821744976817.8111137106593)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1431,7 +1431,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,2,-.22713465002993920385)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1439,7 +1439,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,3,7799465.7219)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1447,7 +1447,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,3,7799457.1019)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1455,7 +1455,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,3,33615678.685289)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1463,7 +1463,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,3,1809619.81714617169373549883)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1471,7 +1471,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,4,15598922.8238)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1479,7 +1479,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,4,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1487,7 +1487,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,4,60831598315717.14146161)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1495,7 +1495,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,4,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1503,7 +1503,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,5,7815858.450391)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1511,7 +1511,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,5,7783064.373409)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1519,7 +1519,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,5,127888068979.9935054429)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1527,7 +1527,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,5,475.66281046305802686061)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1535,7 +1535,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,6,7893362.98953026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1543,7 +1543,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,6,7705559.83426974)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1551,7 +1551,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,6,732381731243.745115764094)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1559,7 +1559,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,6,83.05996138436129499606)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1567,7 +1567,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,7,-75229023.5881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1575,7 +1575,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,7,90827946.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1583,7 +1583,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,7,-647577464846017.9715)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1591,7 +1591,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,7,-.09393717604145131637)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1599,7 +1599,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,8,7874342.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1607,7 +1607,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,8,7724580.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1615,7 +1615,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,8,584031469984.4839)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1623,7 +1623,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,8,104.15808298366741897143)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1631,7 +1631,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (4,9,-17127342.633147420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1639,7 +1639,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (4,9,32726265.456947420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1647,7 +1647,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (4,9,-194415646271340.1815956522980)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1655,7 +1655,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (4,9,-.31289456112403769409)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1663,7 +1663,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,0,16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1671,7 +1671,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,0,16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1679,7 +1679,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1687,7 +1687,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1695,7 +1695,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,1,16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1703,7 +1703,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,1,16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1711,7 +1711,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1719,7 +1719,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1727,7 +1727,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,2,-34322095.176906047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1735,7 +1735,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,2,34354889.253888047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1743,7 +1743,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,2,-563049578578.769242506736077)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1751,7 +1751,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,2,-.00047751189505192446)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1759,7 +1759,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,3,16401.348491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1767,7 +1767,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,3,16392.728491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1775,7 +1775,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,3,70671.23589621)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1783,7 +1783,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,3,3804.41728329466357308584)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1791,7 +1791,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,4,7815858.450391)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1799,7 +1799,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,4,-7783064.373409)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1807,7 +1807,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,4,127888068979.9935054429)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1815,7 +1815,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,4,.00210232958726897192)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1823,7 +1823,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,5,32794.076982)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1831,7 +1831,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,5,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1839,7 +1839,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,5,268862871.275335557081)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1847,7 +1847,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,5,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1855,7 +1855,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,6,110298.61612126)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1863,7 +1863,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,6,-77504.53913926)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1871,7 +1871,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,6,1539707782.76899778633766)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1879,7 +1879,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,6,.17461941433576102689)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1887,7 +1887,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,7,-83012087.961509)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1895,7 +1895,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,7,83044882.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1903,7 +1903,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,7,-1361421264394.416135)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1911,7 +1911,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,7,-.00019748690453643710)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1919,7 +1919,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,8,91278.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1927,7 +1927,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,8,-58483.961509)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1935,7 +1935,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,8,1227826639.244571)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1943,7 +1943,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,8,.21897461960978085228)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1951,7 +1951,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (5,9,-24910407.006556420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1959,7 +1959,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (5,9,24943201.083538420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1967,7 +1967,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (5,9,-408725765384.257043660243220)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1975,7 +1975,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (5,9,-.00065780749354660427)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1983,7 +1983,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,0,93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1991,7 +1991,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,0,93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1999,7 +1999,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2007,7 +2007,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2015,7 +2015,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,1,93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2023,7 +2023,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,1,93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2031,7 +2031,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2039,7 +2039,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2047,7 +2047,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,2,-34244590.637766787)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2055,7 +2055,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,2,34432393.793027307)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2063,7 +2063,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,2,-3224438592470.18449811926184222)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2071,7 +2071,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,2,-.00273458651128995823)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2079,7 +2079,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,3,93905.88763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2087,7 +2087,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,3,93897.26763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2095,7 +2095,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,3,404715.7995864206)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2103,7 +2103,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,3,21786.90896293735498839907)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2111,7 +2111,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,4,7893362.98953026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2119,7 +2119,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,4,-7705559.83426974)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2127,7 +2127,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,4,732381731243.745115764094)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2135,7 +2135,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,4,.01203949512295682469)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2143,7 +2143,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,5,110298.61612126)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2151,7 +2151,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,5,77504.53913926)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2159,7 +2159,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,5,1539707782.76899778633766)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2167,7 +2167,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,5,5.72674008674192359679)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2175,7 +2175,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,6,187803.15526052)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2183,7 +2183,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,6,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2191,7 +2191,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,6,8817506281.4517452372676676)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2199,7 +2199,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,6,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2207,7 +2207,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,7,-82934583.42236974)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2215,7 +2215,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,7,83122386.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2223,7 +2223,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,7,-7796505729750.37795610)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2231,7 +2231,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,7,-.00113095617281538980)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2239,7 +2239,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,8,168782.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2247,7 +2247,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,8,19020.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2255,7 +2255,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,8,7031444034.53149906)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2263,7 +2263,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,8,1.25401073209839612184)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2271,7 +2271,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (6,9,-24832902.467417160)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2279,7 +2279,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (6,9,25020705.622677680)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2287,7 +2287,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (6,9,-2340666225110.29929521292692920)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2295,7 +2295,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (6,9,-.00376709254265256789)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2303,7 +2303,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,0,-83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2311,7 +2311,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,0,-83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2319,7 +2319,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2327,7 +2327,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2335,7 +2335,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,1,-83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2343,7 +2343,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,1,-83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2351,7 +2351,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2359,7 +2359,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2367,7 +2367,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,2,-117366977.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2375,7 +2375,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,2,-48689992.784602953)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2383,7 +2383,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,2,2851072985828710.485883795)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2391,7 +2391,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,2,2.41794207151503385700)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2399,7 +2399,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,3,-83028480.69)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2407,7 +2407,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,3,-83028489.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2415,7 +2415,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,3,-357852770.35)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2423,7 +2423,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,3,-19264149.65197215777262180974)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2431,7 +2431,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,4,-75229023.5881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2439,7 +2439,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,4,-90827946.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2447,7 +2447,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,4,-647577464846017.9715)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2455,7 +2455,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,4,-10.64541262725136247686)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2463,7 +2463,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,5,-83012087.961509)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2471,7 +2471,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,5,-83044882.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2479,7 +2479,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,5,-1361421264394.416135)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2487,7 +2487,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,5,-5063.62688881730941836574)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2495,7 +2495,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,6,-82934583.42236974)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2503,7 +2503,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,6,-83122386.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2511,7 +2511,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,6,-7796505729750.37795610)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2519,7 +2519,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,6,-884.20756174009028770294)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2527,7 +2527,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,7,-166056970)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2535,7 +2535,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,7,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2543,7 +2543,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,7,6893729321395225)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#xL]
@@ -2551,7 +2551,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,7,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2559,7 +2559,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,8,-82953604)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2567,7 +2567,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,8,-83103366)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2575,7 +2575,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,8,-6217255985285)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#xL]
@@ -2583,7 +2583,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,8,-1108.80577182462841041118)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2591,7 +2591,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (7,9,-107955289.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2599,7 +2599,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (7,9,-58101680.954952580)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2607,7 +2607,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (7,9,2069634775752159.035758700)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2615,7 +2615,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (7,9,3.33089171198810413382)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2623,7 +2623,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,0,74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2631,7 +2631,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,0,74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2639,7 +2639,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2647,7 +2647,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2655,7 +2655,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,1,74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2663,7 +2663,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,1,74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2671,7 +2671,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2679,7 +2679,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2687,7 +2687,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,2,-34263611.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2695,7 +2695,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,2,34413373.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2703,7 +2703,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,2,-2571300635581.146276407)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2711,7 +2711,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,2,-.00218067233500788615)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2719,7 +2719,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,3,74885.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2727,7 +2727,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,3,74876.69)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2735,7 +2735,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,3,322737.11)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2743,7 +2743,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,3,17373.78190255220417633410)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2751,7 +2751,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,4,7874342.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2759,7 +2759,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,4,-7724580.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2767,7 +2767,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,4,584031469984.4839)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2775,7 +2775,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,4,.00960079113741758956)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2783,7 +2783,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,5,91278.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2791,7 +2791,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,5,58483.961509)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2799,7 +2799,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,5,1227826639.244571)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2807,7 +2807,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,5,4.56673929509287019456)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2815,7 +2815,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,6,168782.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2823,7 +2823,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,6,-19020.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2831,7 +2831,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,6,7031444034.53149906)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2839,7 +2839,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,6,.79744134113322314424)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2847,7 +2847,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,7,-82953604)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2855,7 +2855,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,7,83103366)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2863,7 +2863,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,7,-6217255985285)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#xL]
@@ -2871,7 +2871,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,7,-.00090187120721280172)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2879,7 +2879,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,8,149762)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2887,7 +2887,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,8,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2895,7 +2895,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,8,5607164161)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#xL as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#xL]
@@ -2903,7 +2903,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,8,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2911,7 +2911,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (8,9,-24851923.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2919,7 +2919,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (8,9,25001685.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2927,7 +2927,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (8,9,-1866544013697.195857020)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2935,7 +2935,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (8,9,-.00300403532938582735)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2943,7 +2943,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,0,-24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2951,7 +2951,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,0,-24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2959,7 +2959,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2967,7 +2967,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2975,7 +2975,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,1,-24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2983,7 +2983,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,1,-24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2991,7 +2991,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -2999,7 +2999,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3007,7 +3007,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,2,-59265296.260444467)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3015,7 +3015,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,2,9411688.170349627)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3023,7 +3023,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,2,855948866655588.453741509242968740)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3031,7 +3031,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,2,.72591434384152961526)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3039,7 +3039,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,3,-24926799.735047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3047,7 +3047,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,3,-24926808.355047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3055,7 +3055,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,3,-107434525.43415438020)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3063,7 +3063,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,3,-5783481.21694835730858468677)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3071,7 +3071,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,4,-17127342.633147420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3079,7 +3079,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,4,-32726265.456947420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3087,7 +3087,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,4,-194415646271340.1815956522980)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3095,7 +3095,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,4,-3.19596478892958416484)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3103,7 +3103,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,5,-24910407.006556420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3111,7 +3111,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,5,-24943201.083538420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3119,7 +3119,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,5,-408725765384.257043660243220)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3127,7 +3127,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,5,-1520.20159364322004505807)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3135,7 +3135,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,6,-24832902.467417160)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3143,7 +3143,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,6,-25020705.622677680)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3151,7 +3151,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,6,-2340666225110.29929521292692920)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3159,7 +3159,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,6,-265.45671195426965751280)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3167,7 +3167,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,7,-107955289.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3175,7 +3175,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,7,58101680.954952580)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3183,7 +3183,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,7,2069634775752159.035758700)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3191,7 +3191,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,7,.30021990699995814689)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3199,7 +3199,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,8,-24851923.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3207,7 +3207,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,8,-25001685.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3215,7 +3215,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,8,-1866544013697.195857020)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3223,7 +3223,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,8,-332.88556569820675471748)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3231,7 +3231,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_add VALUES (9,9,-49853608.090094840)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_add, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_add], Append, `spark_catalog`.`default`.`num_exp_add`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_add), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3239,7 +3239,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sub VALUES (9,9,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sub, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sub], Append, `spark_catalog`.`default`.`num_exp_sub`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sub), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3247,7 +3247,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_mul VALUES (9,9,621345559900192.420120630048656400)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_mul, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_mul], Append, `spark_catalog`.`default`.`num_exp_mul`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_mul), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3255,7 +3255,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_div VALUES (9,9,1.00000000000000000000)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_div, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_div], Append, `spark_catalog`.`default`.`num_exp_div`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_div), [id1, id2, expected]
-+- Project [cast(col1#x as int) AS id1#x, cast(col2#x as int) AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id1#x, col2#x AS id2#x, cast(col3#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -3263,7 +3263,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (0,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3271,7 +3271,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (1,0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3279,7 +3279,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (2,5859.90547836712524903505)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3287,7 +3287,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (3,2.07605394920266944396)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3295,7 +3295,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (4,2792.75158435189147418923)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3303,7 +3303,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (5,128.05092147657509145473)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3311,7 +3311,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (6,306.43364311096782703406)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3319,7 +3319,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (7,9111.99676251039939975230)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3327,7 +3327,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (8,273.64392922189960397542)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3335,7 +3335,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_sqrt VALUES (9,4992.67503899937593364766)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt], Append, `spark_catalog`.`default`.`num_exp_sqrt`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_sqrt), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3343,7 +3343,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3351,7 +3351,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3359,7 +3359,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (2,17.35177750493897715514)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3367,7 +3367,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (3,1.46093790411565641971)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3375,7 +3375,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (4,15.86956523951936572464)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3383,7 +3383,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (5,9.70485601768871834038)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3391,7 +3391,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (6,11.45000246622944403127)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3399,7 +3399,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (7,18.23469429965478772991)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3407,7 +3407,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (8,11.22365546576315513668)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3415,7 +3415,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_ln VALUES (9,17.03145425013166006962)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_ln], Append, `spark_catalog`.`default`.`num_exp_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3423,7 +3423,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3431,7 +3431,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3439,7 +3439,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (2,7.53578122160797276459)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3447,7 +3447,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (3,.63447727016073160075)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3455,7 +3455,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (4,6.89206461372691743345)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3463,7 +3463,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (5,4.21476541614777768626)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3471,7 +3471,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (6,4.97267288886207207671)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3479,7 +3479,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (7,7.91922711353275546914)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3487,7 +3487,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (8,4.87437163556421004138)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3495,7 +3495,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_log10 VALUES (9,7.39666659961986567059)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_log10, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_log10], Append, `spark_catalog`.`default`.`num_exp_log10`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_log10), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3503,7 +3503,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (0,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3511,7 +3511,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (1,double('NaN'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3519,7 +3519,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (2,224790267919917955.13261618583642653184)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3527,7 +3527,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (3,28.90266599445155957393)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3535,7 +3535,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (4,7405685069594999.07733999469386277636)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3543,7 +3543,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (5,5068226527.32127265408584640098)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3551,7 +3551,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (6,281839893606.99372343357047819067)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3573,7 +3573,7 @@ org.apache.spark.SparkArithmeticException
INSERT INTO num_exp_power_10_ln VALUES (8,167361463828.07491320069016125952)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3581,7 +3581,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_exp_power_10_ln VALUES (9,107511333880052007.04141124673540337457)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln], Append, `spark_catalog`.`default`.`num_exp_power_10_ln`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_exp_power_10_ln), [id, expected]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS expected#x]
+- LocalRelation [col1#x, col2#x]
@@ -3589,7 +3589,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (0, 0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3597,7 +3597,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (1, 0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3605,7 +3605,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (2, -34338492.215397047)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3613,7 +3613,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (3, 4.31)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3621,7 +3621,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (4, 7799461.4119)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3629,7 +3629,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (5, 16397.038491)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3637,7 +3637,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (6, 93901.57763026)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3645,7 +3645,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (7, -83028485)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3653,7 +3653,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (8, 74881)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3661,7 +3661,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO num_data VALUES (9, -24926804.045047420)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_data, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_data], Append, `spark_catalog`.`default`.`num_data`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_data), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(38,10)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -3684,7 +3684,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, t1.val + t2.val
FROM num_data t1, num_data t2
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast((val + val)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast((val + val)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, (val#x + val#x) AS (val + val)#x]
+- Join Inner
:- SubqueryAlias t1
@@ -3723,7 +3723,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, round(t1.val + t2.val, 10)
FROM num_data t1, num_data t2
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast(round((val + val), 10)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast(round((val + val), 10)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, round((val#x + val#x), 10) AS round((val + val), 10)#x]
+- Join Inner
:- SubqueryAlias t1
@@ -3762,7 +3762,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, t1.val - t2.val
FROM num_data t1, num_data t2
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast((val - val)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast((val - val)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, (val#x - val#x) AS (val - val)#x]
+- Join Inner
:- SubqueryAlias t1
@@ -3801,7 +3801,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, round(t1.val - t2.val, 40)
FROM num_data t1, num_data t2
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast(round((val - val), 40)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast(round((val - val), 40)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, round((val#x - val#x), 40) AS round((val - val), 40)#x]
+- Join Inner
:- SubqueryAlias t1
@@ -3879,7 +3879,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, round(t1.val * t2.val, 30)
FROM num_data t1, num_data t2
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast(round((val * val), 30)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast(round((val * val), 30)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, round((val#x * val#x), 30) AS round((val * val), 30)#x]
+- Join Inner
:- SubqueryAlias t1
@@ -3919,7 +3919,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, t1.val / t2.val
WHERE t2.val != '0.0'
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast((val / val)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast((val / val)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, (val#x / val#x) AS (val / val)#x]
+- Filter NOT (cast(val#x as double) = cast(0.0 as double))
+- Join Inner
@@ -3960,7 +3960,7 @@ INSERT INTO num_result SELECT t1.id, t2.id, round(t1.val / t2.val, 80)
WHERE t2.val != '0.0'
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(id#x as int) AS id2#x, cast(round((val / val), 80)#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, id#x AS id2#x, cast(round((val / val), 80)#x as decimal(38,10)) AS result#x]
+- Project [id#x, id#x, round((val#x / val#x), 80) AS round((val / val), 80)#x]
+- Filter NOT (cast(val#x as double) = cast(0.0 as double))
+- Join Inner
@@ -4000,7 +4000,7 @@ INSERT INTO num_result SELECT id, 0, SQRT(ABS(val))
FROM num_data
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(0#x as int) AS id2#x, cast(SQRT(abs(val))#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, 0#x AS id2#x, cast(SQRT(abs(val))#x as decimal(38,10)) AS result#x]
+- Project [id#x, 0 AS 0#x, SQRT(cast(abs(val#x) as double)) AS SQRT(abs(val))#x]
+- SubqueryAlias spark_catalog.default.num_data
+- Relation spark_catalog.default.num_data[id#x,val#x] parquet
@@ -4035,7 +4035,7 @@ INSERT INTO num_result SELECT id, 0, LN(ABS(val))
WHERE val != '0.0'
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(0#x as int) AS id2#x, cast(ln(abs(val))#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, 0#x AS id2#x, cast(ln(abs(val))#x as decimal(38,10)) AS result#x]
+- Project [id#x, 0 AS 0#x, ln(cast(abs(val#x) as double)) AS ln(abs(val))#x]
+- Filter NOT (cast(val#x as double) = cast(0.0 as double))
+- SubqueryAlias spark_catalog.default.num_data
@@ -4071,7 +4071,7 @@ INSERT INTO num_result SELECT id, 0, LOG(cast('10' as decimal(38, 18)), ABS(val)
WHERE val != '0.0'
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(0#x as int) AS id2#x, cast(LOG(CAST(10 AS DECIMAL(38,18)), abs(val))#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, 0#x AS id2#x, cast(LOG(CAST(10 AS DECIMAL(38,18)), abs(val))#x as decimal(38,10)) AS result#x]
+- Project [id#x, 0 AS 0#x, LOG(cast(cast(10 as decimal(38,18)) as double), cast(abs(val#x) as double)) AS LOG(CAST(10 AS DECIMAL(38,18)), abs(val))#x]
+- Filter NOT (cast(val#x as double) = cast(0.0 as double))
+- SubqueryAlias spark_catalog.default.num_data
@@ -4107,7 +4107,7 @@ INSERT INTO num_result SELECT id, 0, POWER(cast('10' as decimal(38, 18)), LN(ABS
WHERE val != '0.0'
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/num_result, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/num_result], Append, `spark_catalog`.`default`.`num_result`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/num_result), [id1, id2, result]
-+- Project [cast(id#x as int) AS id1#x, cast(0#x as int) AS id2#x, cast(POWER(CAST(10 AS DECIMAL(38,18)), ln(abs(round(val, 200))))#x as decimal(38,10)) AS result#x]
++- Project [id#x AS id1#x, 0#x AS id2#x, cast(POWER(CAST(10 AS DECIMAL(38,18)), ln(abs(round(val, 200))))#x as decimal(38,10)) AS result#x]
+- Project [id#x, 0 AS 0#x, POWER(cast(cast(10 as decimal(38,18)) as double), ln(cast(abs(round(val#x, 200)) as double))) AS POWER(CAST(10 AS DECIMAL(38,18)), ln(abs(round(val, 200))))#x]
+- Filter NOT (cast(val#x as double) = cast(0.0 as double))
+- SubqueryAlias spark_catalog.default.num_data
@@ -4149,7 +4149,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`fract_only`, false
INSERT INTO fract_only VALUES (1, 0.0)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/fract_only, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/fract_only], Append, `spark_catalog`.`default`.`fract_only`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/fract_only), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -4157,7 +4157,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO fract_only VALUES (2, 0.1)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/fract_only, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/fract_only], Append, `spark_catalog`.`default`.`fract_only`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/fract_only), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -4165,7 +4165,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO fract_only VALUES (4, -0.9999)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/fract_only, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/fract_only], Append, `spark_catalog`.`default`.`fract_only`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/fract_only), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
++- Project [col1#x AS id#x, col2#x AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -4173,7 +4173,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO fract_only VALUES (5, 0.99994)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/fract_only, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/fract_only], Append, `spark_catalog`.`default`.`fract_only`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/fract_only), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -4181,7 +4181,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO fract_only VALUES (7, 0.00001)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/fract_only, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/fract_only], Append, `spark_catalog`.`default`.`fract_only`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/fract_only), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -4189,7 +4189,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO fract_only VALUES (8, 0.00017)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/fract_only, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/fract_only], Append, `spark_catalog`.`default`.`fract_only`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/fract_only), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
++- Project [col1#x AS id#x, cast(col2#x as decimal(4,4)) AS val#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_having.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_having.sql.out
index 640ab20757936..72b607951ec1d 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_having.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_having.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`test_having`, false
INSERT INTO test_having VALUES (0, 1, 'XXXX', 'A')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (1, 2, 'AAAA', 'b')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (2, 2, 'AAAA', 'c')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (3, 3, 'BBBB', 'D')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (4, 3, 'BBBB', 'e')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -49,7 +49,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (5, 3, 'bbbb', 'F')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -57,7 +57,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (6, 4, 'cccc', 'g')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -65,7 +65,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (7, 4, 'cccc', 'h')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -73,7 +73,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (8, 4, 'CCCC', 'I')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -81,7 +81,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_having VALUES (9, 4, 'CCCC', 'j')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_having, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_having], Append, `spark_catalog`.`default`.`test_having`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_having), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_implicit.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_implicit.sql.out
index 83b10b3cb67c4..e456a80d5e049 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_implicit.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/select_implicit.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`test_missing_target`, fa
INSERT INTO test_missing_target VALUES (0, 1, 'XXXX', 'A')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (1, 2, 'ABAB', 'b')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (2, 2, 'ABAB', 'c')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (3, 3, 'BBBB', 'D')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (4, 3, 'BBBB', 'e')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -49,7 +49,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (5, 3, 'bbbb', 'F')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -57,7 +57,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (6, 4, 'cccc', 'g')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -65,7 +65,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (7, 4, 'cccc', 'h')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -73,7 +73,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (8, 4, 'CCCC', 'I')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -81,7 +81,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO test_missing_target VALUES (9, 4, 'CCCC', 'j')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test_missing_target, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test_missing_target], Append, `spark_catalog`.`default`.`test_missing_target`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test_missing_target), [a, b, c, d]
-+- Project [cast(col1#x as int) AS a#x, cast(col2#x as int) AS b#x, cast(col3#x as string) AS c#x, cast(col4#x as string) AS d#x]
++- Project [col1#x AS a#x, col2#x AS b#x, col3#x AS c#x, col4#x AS d#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/strings.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/strings.sql.out
index 2a4d79360b5c1..57d6a813c25d3 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/strings.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/strings.sql.out
@@ -512,7 +512,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`toasttest`, false
insert into toasttest values(repeat('1234567890',10000))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/toasttest, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/toasttest], Append, `spark_catalog`.`default`.`toasttest`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/toasttest), [f1]
-+- Project [cast(col1#x as string) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -520,7 +520,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into toasttest values(repeat('1234567890',10000))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/toasttest, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/toasttest], Append, `spark_catalog`.`default`.`toasttest`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/toasttest), [f1]
-+- Project [cast(col1#x as string) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -528,7 +528,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into toasttest values(repeat('1234567890',10000))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/toasttest, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/toasttest], Append, `spark_catalog`.`default`.`toasttest`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/toasttest), [f1]
-+- Project [cast(col1#x as string) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -536,7 +536,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
insert into toasttest values(repeat('1234567890',10000))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/toasttest, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/toasttest], Append, `spark_catalog`.`default`.`toasttest`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/toasttest), [f1]
-+- Project [cast(col1#x as string) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/text.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/text.sql.out
index 474c2401f40d0..ef7b7a4180ba1 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/text.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/text.sql.out
@@ -23,7 +23,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`TEXT_TBL`, false
INSERT INTO TEXT_TBL VALUES ('doh!')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/text_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/text_tbl], Append, `spark_catalog`.`default`.`text_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/text_tbl), [f1]
-+- Project [cast(col1#x as string) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
@@ -31,7 +31,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TEXT_TBL VALUES ('hi de ho neighbor')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/text_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/text_tbl], Append, `spark_catalog`.`default`.`text_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/text_tbl), [f1]
-+- Project [cast(col1#x as string) AS f1#x]
++- Project [col1#x AS f1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/timestamp.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/timestamp.sql.out
index a6c3c27829698..3bc151fe61956 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/timestamp.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/timestamp.sql.out
@@ -9,7 +9,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`TIMESTAMP_TBL`, false
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'now')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -17,7 +17,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'now')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -25,7 +25,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'today')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -33,7 +33,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'yesterday')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -41,7 +41,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'tomorrow')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -49,7 +49,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'tomorrow EST')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -57,7 +57,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'tomorrow Zulu')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -89,7 +89,7 @@ TruncateTableCommand `spark_catalog`.`default`.`timestamp_tbl`
INSERT INTO TIMESTAMP_TBL VALUES (timestamp'epoch')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -97,7 +97,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp('1997-01-02'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -105,7 +105,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp('1997-01-02 03:04:05'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -113,7 +113,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp('1997-02-10 17:32:01-08'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
@@ -121,7 +121,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO TIMESTAMP_TBL VALUES (timestamp('2001-09-22T18:19:20'))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/timestamp_tbl, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/timestamp_tbl], Append, `spark_catalog`.`default`.`timestamp_tbl`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/timestamp_tbl), [d1]
-+- Project [cast(col1#x as timestamp) AS d1#x]
++- Project [col1#x AS d1#x]
+- LocalRelation [col1#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part2.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part2.sql.out
index cdcd563de4f6a..5281494bece15 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part2.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part2.sql.out
@@ -24,7 +24,7 @@ INSERT INTO empsalary VALUES
('develop', 11, 5200, date '2007-08-15')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/empsalary, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/empsalary], Append, `spark_catalog`.`default`.`empsalary`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/empsalary), [depname, empno, salary, enroll_date]
-+- Project [cast(col1#x as string) AS depname#x, cast(col2#x as int) AS empno#x, cast(col3#x as int) AS salary#x, cast(col4#x as date) AS enroll_date#x]
++- Project [col1#x AS depname#x, col2#x AS empno#x, col3#x AS salary#x, col4#x AS enroll_date#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -280,7 +280,7 @@ insert into numerics values
(7, 100, 100, 100)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/numerics, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/numerics], Append, `spark_catalog`.`default`.`numerics`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/numerics), [id, f_float4, f_float8, f_numeric]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as float) AS f_float4#x, cast(col3#x as float) AS f_float8#x, cast(col4#x as int) AS f_numeric#x]
++- Project [col1#x AS id#x, cast(col2#x as float) AS f_float4#x, cast(col3#x as float) AS f_float8#x, cast(col4#x as int) AS f_numeric#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part3.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part3.sql.out
index d552c108d4612..bc6dc828ad857 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part3.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/window_part3.sql.out
@@ -33,7 +33,7 @@ INSERT INTO empsalary VALUES
('develop', 11, 5200, date '2007-08-15')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/empsalary, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/empsalary], Append, `spark_catalog`.`default`.`empsalary`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/empsalary), [depname, empno, salary, enroll_date]
-+- Project [cast(col1#x as string) AS depname#x, cast(col2#x as int) AS empno#x, cast(col3#x as int) AS salary#x, cast(col4#x as date) AS enroll_date#x]
++- Project [col1#x AS depname#x, col2#x AS empno#x, col3#x AS salary#x, col4#x AS enroll_date#x]
+- LocalRelation [col1#x, col2#x, col3#x, col4#x]
@@ -223,7 +223,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`t1`, false
insert into t1 values (1,1),(1,2),(2,2)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/t1, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/t1], Append, `spark_catalog`.`default`.`t1`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/t1), [f1, f2]
-+- Project [cast(col1#x as int) AS f1#x, cast(col2#x as int) AS f2#x]
++- Project [col1#x AS f1#x, col2#x AS f2#x]
+- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/with.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/with.sql.out
index de86c88f6d1b9..edbdcba851483 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/with.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/postgreSQL/with.sql.out
@@ -325,7 +325,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`department`, false
INSERT INTO department VALUES (0, NULL, 'ROOT')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, cast(col2#x as int) AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -333,7 +333,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (1, 0, 'A')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -341,7 +341,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (2, 1, 'B')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -349,7 +349,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (3, 2, 'C')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -357,7 +357,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (4, 2, 'D')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -365,7 +365,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (5, 0, 'E')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -373,7 +373,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (6, 4, 'F')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -381,7 +381,7 @@ InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_d
INSERT INTO department VALUES (7, 5, 'G')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/department, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/department], Append, `spark_catalog`.`default`.`department`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/department), [id, parent_department, name]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_department#x, cast(col3#x as string) AS name#x]
++- Project [col1#x AS id#x, col2#x AS parent_department#x, col3#x AS name#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -774,7 +774,7 @@ VALUES (1, NULL), (2, 1), (3,1), (4,2), (5,2), (6,2), (7,3), (8,3),
(9,4), (10,4), (11,7), (12,7), (13,7), (14, 9), (15,11), (16,11)
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/tree, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/tree], Append, `spark_catalog`.`default`.`tree`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/tree), [id, parent_id]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as int) AS parent_id#x]
++- Project [col1#x AS id#x, col2#x AS parent_id#x]
+- LocalRelation [col1#x, col2#x]
@@ -902,7 +902,7 @@ insert into graph values
(5, 1, 'arc 5 -> 1')
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/graph, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/graph], Append, `spark_catalog`.`default`.`graph`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/graph), [f, t, label]
-+- Project [cast(col1#x as int) AS f#x, cast(col2#x as int) AS t#x, cast(col3#x as string) AS label#x]
++- Project [col1#x AS f#x, col2#x AS t#x, col3#x AS label#x]
+- LocalRelation [col1#x, col2#x, col3#x]
@@ -1111,7 +1111,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`y`, false
INSERT INTO y SELECT EXPLODE(SEQUENCE(1, 10))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/y, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/y], Append, `spark_catalog`.`default`.`y`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/y), [a]
-+- Project [cast(col#x as int) AS a#x]
++- Project [col#x AS a#x]
+- Project [col#x]
+- Generate explode(sequence(1, 10, None, Some(America/Los_Angeles))), false, [col#x]
+- OneRowRelation
@@ -1183,20 +1183,10 @@ org.apache.spark.sql.AnalysisException
WITH RECURSIVE x(n) AS (SELECT n FROM x UNION ALL SELECT 1)
SELECT * FROM x
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
+org.apache.spark.sql.AnalysisException
{
- "errorClass" : "UNRESOLVED_COLUMN.WITHOUT_SUGGESTION",
- "sqlState" : "42703",
- "messageParameters" : {
- "objectName" : "`n`"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 32,
- "stopIndex" : 32,
- "fragment" : "n"
- } ]
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
}
@@ -1210,7 +1200,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`y`, false
INSERT INTO y SELECT EXPLODE(SEQUENCE(1, 10))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/y, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/y], Append, `spark_catalog`.`default`.`y`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/y), [a]
-+- Project [cast(col#x as int) AS a#x]
++- Project [col#x AS a#x]
+- Project [col#x]
+- Generate explode(sequence(1, 10, None, Some(America/Los_Angeles))), false, [col#x]
+- OneRowRelation
@@ -1670,15 +1660,8 @@ SELECT * FROM outermost ORDER BY 1
-- !query analysis
org.apache.spark.sql.AnalysisException
{
- "errorClass" : "UNION_NOT_SUPPORTED_IN_RECURSIVE_CTE",
- "sqlState" : "42836",
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 1,
- "stopIndex" : 185,
- "fragment" : "WITH RECURSIVE outermost(x) AS (\n WITH innermost as (SELECT 2 FROM outermost) -- fail\n SELECT * FROM innermost\n UNION SELECT * from outermost\n)\nSELECT * FROM outermost ORDER BY 1"
- } ]
+ "errorClass" : "INVALID_RECURSIVE_CTE",
+ "sqlState" : "42836"
}
@@ -1719,7 +1702,7 @@ TruncateTableCommand `spark_catalog`.`default`.`y`
INSERT INTO y SELECT EXPLODE(SEQUENCE(1, 3))
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/y, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/y], Append, `spark_catalog`.`default`.`y`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/y), [a]
-+- Project [cast(col#x as int) AS a#x]
++- Project [col#x AS a#x]
+- Project [col#x]
+- Generate explode(sequence(1, 3, None, Some(America/Los_Angeles))), false, [col#x]
+- OneRowRelation
@@ -1773,7 +1756,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`parent`, false
INSERT INTO parent VALUES ( 1, 'p1' )
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/parent, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/parent], Append, `spark_catalog`.`default`.`parent`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/parent), [id, val]
-+- Project [cast(col1#x as int) AS id#x, cast(col2#x as string) AS val#x]
++- Project [col1#x AS id#x, col2#x AS val#x]
+- LocalRelation [col1#x, col2#x]
@@ -1876,7 +1859,7 @@ CreateDataSourceTableCommand `spark_catalog`.`default`.`test`, false
with test as (select 42) insert into test select * from test
-- !query analysis
InsertIntoHadoopFsRelationCommand file:[not included in comparison]/{warehouse_dir}/test, false, Parquet, [path=file:[not included in comparison]/{warehouse_dir}/test], Append, `spark_catalog`.`default`.`test`, org.apache.spark.sql.execution.datasources.InMemoryFileIndex(file:[not included in comparison]/{warehouse_dir}/test), [i]
-+- Project [cast(42#x as int) AS i#x]
++- Project [42#x AS i#x]
+- WithCTE
:- CTERelationDef xxxx, false
: +- SubqueryAlias test
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/replacing-missing-expression-with-alias.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/replacing-missing-expression-with-alias.sql.out
new file mode 100644
index 0000000000000..a353c9e8ed018
--- /dev/null
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/replacing-missing-expression-with-alias.sql.out
@@ -0,0 +1,204 @@
+-- Automatically generated by SQLQueryTestSuite
+-- !query
+SELECT col1 + 1 AS a FROM VALUES(1) GROUP BY a ORDER BY col1 + 1
+-- !query analysis
+Sort [a#x ASC NULLS FIRST], true
++- Aggregate [(col1#x + 1)], [(col1#x + 1) AS a#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 + 1 AS a, a AS b FROM VALUES(1) GROUP BY a ORDER BY col1 + 1
+-- !query analysis
+Sort [a#x ASC NULLS FIRST], true
++- Project [a#x, a#x AS b#x]
+ +- Project [(col1 + 1)#x, (col1 + 1)#x AS a#x]
+ +- Aggregate [(col1#x + 1)], [(col1#x + 1) AS (col1 + 1)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 + 1 AS a FROM VALUES(1) GROUP BY a HAVING col1 + 1 > 0
+-- !query analysis
+Filter (a#x > 0)
++- Aggregate [(col1#x + 1)], [(col1#x + 1) AS a#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 + 1 AS a, a AS b FROM VALUES(1) GROUP BY a HAVING col1 + 1 > 0
+-- !query analysis
+Filter (a#x > 0)
++- Project [a#x, a#x AS b#x]
+ +- Project [(col1 + 1)#x, (col1 + 1)#x AS a#x]
+ +- Aggregate [(col1#x + 1)], [(col1#x + 1) AS (col1 + 1)#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1, col2, GROUPING(col1) FROM VALUES("abc", 1) GROUP BY CUBE(col1, col2) ORDER BY GROUPING(col1)
+-- !query analysis
+Sort [grouping(col1)#x ASC NULLS FIRST], true
++- Aggregate [col1#x, col2#x, spark_grouping_id#xL], [col1#x, col2#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(col1)#x]
+ +- Expand [[col1#x, col2#x, col1#x, col2#x, 0], [col1#x, col2#x, col1#x, null, 1], [col1#x, col2#x, null, col2#x, 2], [col1#x, col2#x, null, null, 3]], [col1#x, col2#x, col1#x, col2#x, spark_grouping_id#xL]
+ +- Project [col1#x, col2#x, col1#x AS col1#x, col2#x AS col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col1, col2, GROUPING(col1) FROM VALUES("abc", 1) GROUP BY CUBE(col1, col2) HAVING GROUPING(col1) != NULL
+-- !query analysis
+Filter NOT (grouping(col1)#x = cast(null as tinyint))
++- Aggregate [col1#x, col2#x, spark_grouping_id#xL], [col1#x, col2#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(col1)#x]
+ +- Expand [[col1#x, col2#x, col1#x, col2#x, 0], [col1#x, col2#x, col1#x, null, 1], [col1#x, col2#x, null, col2#x, 2], [col1#x, col2#x, null, null, 3]], [col1#x, col2#x, col1#x, col2#x, spark_grouping_id#xL]
+ +- Project [col1#x, col2#x, col1#x AS col1#x, col2#x AS col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT make_date(col1, col2, col3) AS a FROM VALUES(1,2,3) GROUP BY make_date(col1, col2, col3) ORDER BY make_date(col1, col2, col3)
+-- !query analysis
+Sort [a#x ASC NULLS FIRST], true
++- Aggregate [make_date(col1#x, col2#x, col3#x, true)], [make_date(col1#x, col2#x, col3#x, true) AS a#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+SELECT make_date(col1, col2, col3) AS a, a AS b FROM VALUES(1,2,3) GROUP BY make_date(col1, col2, col3) ORDER BY make_date(col1, col2, col3)
+-- !query analysis
+Sort [a#x ASC NULLS FIRST], true
++- Project [a#x, a#x AS b#x]
+ +- Project [make_date(col1, col2, col3)#x, make_date(col1, col2, col3)#x AS a#x]
+ +- Aggregate [make_date(col1#x, col2#x, col3#x, true)], [make_date(col1#x, col2#x, col3#x, true) AS make_date(col1, col2, col3)#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+SELECT make_date(col1, col2, col3) AS a FROM VALUES(1,2,3) GROUP BY make_date(col1, col2, col3) HAVING make_date(col1, col2, col3) > '2025-01-01'
+-- !query analysis
+Filter (a#x > cast(2025-01-01 as date))
++- Aggregate [make_date(col1#x, col2#x, col3#x, true)], [make_date(col1#x, col2#x, col3#x, true) AS a#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+SELECT make_date(col1, col2, col3) AS a, a AS b FROM VALUES(1,2,3) GROUP BY make_date(col1, col2, col3) HAVING make_date(col1, col2, col3) > '2025-01-01'
+-- !query analysis
+Filter (a#x > cast(2025-01-01 as date))
++- Project [a#x, a#x AS b#x]
+ +- Project [make_date(col1, col2, col3)#x, make_date(col1, col2, col3)#x AS a#x]
+ +- Aggregate [make_date(col1#x, col2#x, col3#x, true)], [make_date(col1#x, col2#x, col3#x, true) AS make_date(col1, col2, col3)#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+SELECT make_date(col1, col2, col3) AS a FROM VALUES(1,2,3) ORDER BY make_date(col1, col2, col3)
+-- !query analysis
+Project [a#x]
++- Sort [make_date(col1#x, col2#x, col3#x, true) ASC NULLS FIRST], true
+ +- Project [make_date(col1#x, col2#x, col3#x, true) AS a#x, col1#x, col2#x, col3#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+SELECT make_date(col1, col2, col3) AS a, a AS b FROM VALUES(1,2,3) ORDER BY make_date(col1, col2, col3)
+-- !query analysis
+Project [a#x, b#x]
++- Sort [make_date(col1#x, col2#x, col3#x, true) ASC NULLS FIRST], true
+ +- Project [a#x, a#x AS b#x, col1#x, col2#x, col3#x]
+ +- Project [col1#x, col2#x, col3#x, make_date(col1#x, col2#x, col3#x, true) AS a#x]
+ +- LocalRelation [col1#x, col2#x, col3#x]
+
+
+-- !query
+SELECT col1, col1 AS a FROM VALUES(1) GROUP BY col1 ORDER BY col1 ASC
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [col1#x], [col1#x, col1#x AS a#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS a, col1 FROM VALUES(1) GROUP BY col1 ORDER BY col1 ASC
+-- !query analysis
+Sort [col1#x ASC NULLS FIRST], true
++- Aggregate [col1#x], [col1#x AS a#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1, col1 AS a FROM VALUES(1) GROUP BY col1 HAVING col1 > 0
+-- !query analysis
+Filter (col1#x > 0)
++- Aggregate [col1#x], [col1#x, col1#x AS a#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col1 AS a, col1 FROM VALUES(1) GROUP BY col1 HAVING col1 > 0
+-- !query analysis
+Filter (col1#x > 0)
++- Aggregate [col1#x], [col1#x AS a#x, col1#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT col2 AS b, col2 FROM VALUES(1,2) GROUP BY 1,2 ORDER BY ALL
+-- !query analysis
+Sort [b#x ASC NULLS FIRST, col2#x ASC NULLS FIRST], true
++- Aggregate [col2#x, col2#x], [col2#x AS b#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col2 AS b, col2 FROM VALUES(1,2) GROUP BY 1,2 HAVING col2 > 0 ORDER BY ALL
+-- !query analysis
+Sort [b#x ASC NULLS FIRST, col2#x ASC NULLS FIRST], true
++- Filter (col2#x > 0)
+ +- Aggregate [col2#x, col2#x], [col2#x AS b#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col2 AS b, col2, b as c FROM VALUES(1,2) GROUP BY 1,2 ORDER BY ALL
+-- !query analysis
+Sort [b#x ASC NULLS FIRST, col2#x ASC NULLS FIRST, c#x ASC NULLS FIRST], true
++- Project [b#x, col2#x, b#x AS c#x]
+ +- Project [col2#x, col2#x AS b#x]
+ +- Aggregate [col2#x, col2#x], [col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col2 AS b, col2, b as c FROM VALUES(1,2) GROUP BY 1,2 HAVING col2 > 0 ORDER BY ALL
+-- !query analysis
+Sort [b#x ASC NULLS FIRST, col2#x ASC NULLS FIRST, c#x ASC NULLS FIRST], true
++- Filter (col2#x > 0)
+ +- Project [b#x, col2#x, b#x AS c#x]
+ +- Project [col2#x, col2#x AS b#x]
+ +- Aggregate [col2#x, col2#x], [col2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col1 AS a FROM VALUES(1,2) GROUP BY col1, col2 HAVING col2 > 1 ORDER BY col1
+-- !query analysis
+Project [a#x]
++- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [a#x, col1#x]
+ +- Filter (col2#x > 1)
+ +- Aggregate [col1#x, col2#x], [col1#x AS a#x, col2#x, col1#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT col1 AS a, a AS b FROM VALUES(1,2) GROUP BY col1, col2 HAVING col2 > 1 ORDER BY col1
+-- !query analysis
+Project [a#x, b#x]
++- Sort [col1#x ASC NULLS FIRST], true
+ +- Project [a#x, b#x, col1#x]
+ +- Filter (col2#x > 1)
+ +- Project [a#x, a#x AS b#x, col2#x, col1#x]
+ +- Project [col1#x, col2#x, col1#x AS a#x]
+ +- Aggregate [col1#x, col2#x], [col1#x, col2#x]
+ +- LocalRelation [col1#x, col2#x]
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/sql-session-variables.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/sql-session-variables.sql.out
index 6f22f598498c6..7d23f27cdf5d6 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/sql-session-variables.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/sql-session-variables.sql.out
@@ -1247,9 +1247,176 @@ DropVariable false
-- !query
-SET VARIABLE title = 'SET VARIABLE - row assignment'
+SET VARIABLE title = 'DECLARE VARIABLE - multiple variables declared at once'
-- !query analysis
SetVariable [variablereference(system.session.title='SET VARIABLE - comma separated target')]
++- Project [DECLARE VARIABLE - multiple variables declared at once AS title#x]
+ +- OneRowRelation
+
+
+-- !query
+DECLARE VARIABLE var1, var2, var3 INT
+-- !query analysis
+CreateVariable defaultvalueexpression(null, null), false
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var1
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var2
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var3
+
+
+-- !query
+DECLARE VARIABLE var4, var5, var6 INT DEFAULT CAST(RAND(0) * 10 AS INT)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+DECLARE VARIABLE var7, var8, var9 DEFAULT 5
+-- !query analysis
+CreateVariable defaultvalueexpression(5, 5), false
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var7
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var8
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var9
+
+
+-- !query
+SELECT var4 = var5, var4 = var6, var5 = var6
+-- !query analysis
+Project [(variablereference(system.session.var4=7) = variablereference(system.session.var5=7)) AS (variablereference(system.session.var4=7) = variablereference(system.session.var5=7))#x, (variablereference(system.session.var4=7) = variablereference(system.session.var6=7)) AS (variablereference(system.session.var4=7) = variablereference(system.session.var6=7))#x, (variablereference(system.session.var5=7) = variablereference(system.session.var6=7)) AS (variablereference(system.session.var5=7) = variablereference(system.session.var6=7))#x]
++- OneRowRelation
+
+
+-- !query
+DECLARE OR REPLACE VARIABLE var1, var2, var3 DOUBLE
+-- !query analysis
+CreateVariable defaultvalueexpression(null, null), true
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var1
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var2
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var3
+
+
+-- !query
+DECLARE OR REPLACE VARIABLE var4, var5, var6 DOUBLE DEFAULT RAND(0)
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+DECLARE OR REPLACE VARIABLE var7, var8, var9 DEFAULT 1.5
+-- !query analysis
+CreateVariable defaultvalueexpression(1.5, 1.5), true
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var7
+:- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var8
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var9
+
+
+-- !query
+SELECT var4 = var5, var4 = var6, var5 = var6
+-- !query analysis
+Project [(variablereference(system.session.var4=0.7604953758285915D) = variablereference(system.session.var5=0.7604953758285915D)) AS (variablereference(system.session.var4=0.7604953758285915D) = variablereference(system.session.var5=0.7604953758285915D))#x, (variablereference(system.session.var4=0.7604953758285915D) = variablereference(system.session.var6=0.7604953758285915D)) AS (variablereference(system.session.var4=0.7604953758285915D) = variablereference(system.session.var6=0.7604953758285915D))#x, (variablereference(system.session.var5=0.7604953758285915D) = variablereference(system.session.var6=0.7604953758285915D)) AS (variablereference(system.session.var5=0.7604953758285915D) = variablereference(system.session.var6=0.7604953758285915D))#x]
++- OneRowRelation
+
+
+-- !query
+DROP TEMPORARY VARIABLE var1
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var1
+
+
+-- !query
+DROP TEMPORARY VARIABLE var2
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var2
+
+
+-- !query
+DROP TEMPORARY VARIABLE var3
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var3
+
+
+-- !query
+DROP TEMPORARY VARIABLE var4
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var4
+
+
+-- !query
+DROP TEMPORARY VARIABLE var5
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var5
+
+
+-- !query
+DROP TEMPORARY VARIABLE var6
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var6
+
+
+-- !query
+DROP TEMPORARY VARIABLE var7
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var7
+
+
+-- !query
+DROP TEMPORARY VARIABLE var8
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var8
+
+
+-- !query
+DROP TEMPORARY VARIABLE var9
+-- !query analysis
+DropVariable false
++- ResolvedIdentifier org.apache.spark.sql.catalyst.analysis.FakeSystemCatalog$@xxxxxxxx, session.var9
+
+
+-- !query
+SET VARIABLE title = 'DECLARE VARIABLE - duplicate names'
+-- !query analysis
+SetVariable [variablereference(system.session.title='DECLARE VARIABLE - multiple variables declared at once')]
++- Project [DECLARE VARIABLE - duplicate names AS title#x]
+ +- OneRowRelation
+
+
+-- !query
+DECLARE VARIABLE var1, var2, vAr1 INT
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "DUPLICATE_VARIABLE_NAME_INSIDE_DECLARE",
+ "sqlState" : "42734",
+ "messageParameters" : {
+ "variableName" : "`system`.`session`.`var1`"
+ }
+}
+
+
+-- !query
+DECLARE OR REPLACE VARIABLE var1, var2, vAr1 INT
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "DUPLICATE_VARIABLE_NAME_INSIDE_DECLARE",
+ "sqlState" : "42734",
+ "messageParameters" : {
+ "variableName" : "`system`.`session`.`var1`"
+ }
+}
+
+
+-- !query
+SET VARIABLE title = 'SET VARIABLE - row assignment'
+-- !query analysis
+SetVariable [variablereference(system.session.title='DECLARE VARIABLE - duplicate names')]
+- Project [SET VARIABLE - row assignment AS title#x]
+- OneRowRelation
diff --git a/sql/core/src/test/resources/sql-tests/analyzer-results/sql-udf.sql.out b/sql/core/src/test/resources/sql-tests/analyzer-results/sql-udf.sql.out
index d24ab2c760fbc..2b8a47c9ca633 100644
--- a/sql/core/src/test/resources/sql-tests/analyzer-results/sql-udf.sql.out
+++ b/sql/core/src/test/resources/sql-tests/analyzer-results/sql-udf.sql.out
@@ -2,16 +2,7 @@
-- !query
CREATE FUNCTION foo1a0() RETURNS INT RETURN 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo1a0`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo1a0, INT, 1, false, false, false, false
-- !query
@@ -48,16 +39,7 @@ org.apache.spark.sql.AnalysisException
-- !query
CREATE FUNCTION foo1a1(a INT) RETURNS INT RETURN 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo1a1`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo1a1, a INT, INT, 1, false, false, false, false
-- !query
@@ -94,16 +76,7 @@ org.apache.spark.sql.AnalysisException
-- !query
CREATE FUNCTION foo1a2(a INT, b INT, c INT, d INT) RETURNS INT RETURN 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo1a2`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo1a2, a INT, b INT, c INT, d INT, INT, 1, false, false, false, false
-- !query
@@ -117,16 +90,7 @@ Project [spark_catalog.default.foo1a2(a#x, b#x, c#x, d#x) AS spark_catalog.defau
-- !query
CREATE FUNCTION foo1b0() RETURNS TABLE (c1 INT) RETURN SELECT 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo1b0`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo1b0, c1 INT, SELECT 1, true, false, false, false
-- !query
@@ -143,16 +107,7 @@ Project [c1#x]
-- !query
CREATE FUNCTION foo1b1(a INT) RETURNS TABLE (c1 INT) RETURN SELECT 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo1b1`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo1b1, a INT, c1 INT, SELECT 1, true, false, false, false
-- !query
@@ -169,16 +124,7 @@ Project [c1#x]
-- !query
CREATE FUNCTION foo1b2(a INT, b INT, c INT, d INT) RETURNS TABLE(c1 INT) RETURN SELECT 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo1b2`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo1b2, a INT, b INT, c INT, d INT, c1 INT, SELECT 1, true, false, false, false
-- !query
@@ -643,16 +589,7 @@ org.apache.spark.sql.catalyst.parser.ParseException
-- !query
CREATE FUNCTION foo2a2() RETURNS TABLE(c1 INT, c2 INT) RETURN SELECT 1, 2
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2a2`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo2a2, c1 INT, c2 INT, SELECT 1, 2, true, false, false, false
-- !query
@@ -669,16 +606,7 @@ Project [c1#x, c2#x]
-- !query
CREATE FUNCTION foo2a4() RETURNS TABLE(c1 INT, c2 INT, c3 INT, c4 INT) RETURN SELECT 1, 2, 3, 4
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2a4`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo2a4, c1 INT, c2 INT, c3 INT, c4 INT, SELECT 1, 2, 3, 4, true, false, false, false
-- !query
@@ -788,16 +716,7 @@ org.apache.spark.sql.AnalysisException
-- !query
CREATE FUNCTION foo41() RETURNS INT RETURN SELECT 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo41`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo41, INT, SELECT 1, false, false, false, false
-- !query
@@ -814,2791 +733,4640 @@ org.apache.spark.sql.AnalysisException
-- !query
-CREATE FUNCTION foo2_1a(a INT) RETURNS INT RETURN a
+CREATE FUNCTION foo51() RETURNS INT RETURN (SELECT a FROM VALUES(1), (2) AS T(a))
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_1a`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo51, INT, (SELECT a FROM VALUES(1), (2) AS T(a)), false, false, false, false
-- !query
-SELECT foo2_1a(5)
+SELECT foo51()
-- !query analysis
-Project [spark_catalog.default.foo2_1a(a#x) AS spark_catalog.default.foo2_1a(5)#x]
-+- Project [cast(5 as int) AS a#x]
+Project [spark_catalog.default.foo51() AS spark_catalog.default.foo51()#x]
+: +- Project [a#x]
+: +- SubqueryAlias T
+: +- LocalRelation [a#x]
++- Project
+- OneRowRelation
-- !query
-CREATE FUNCTION foo2_1b(a INT, b INT) RETURNS INT RETURN a + b
+CREATE FUNCTION foo52() RETURNS INT RETURN (SELECT 1 FROM VALUES(1) WHERE 1 = 0)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_1b`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo52, INT, (SELECT 1 FROM VALUES(1) WHERE 1 = 0), false, false, false, false
-- !query
-SELECT foo2_1b(5, 6)
+SELECT foo52()
-- !query analysis
-Project [spark_catalog.default.foo2_1b(a#x, b#x) AS spark_catalog.default.foo2_1b(5, 6)#x]
-+- Project [cast(5 as int) AS a#x, cast(6 as int) AS b#x]
+Project [spark_catalog.default.foo52() AS spark_catalog.default.foo52()#x]
+: +- Project [1 AS 1#x]
+: +- Filter (1 = 0)
+: +- LocalRelation [col1#x]
++- Project
+- OneRowRelation
-- !query
-CREATE FUNCTION foo2_1c(a INT, b INT) RETURNS INT RETURN 10 * (a + b) + 100 * (a -b)
+CREATE FUNCTION foo6c(` a` INT, a INT, `a b` INT) RETURNS INT RETURN 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_1c`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo6c, ` a` INT, a INT, `a b` INT, INT, 1, false, false, false, false
-- !query
-SELECT foo2_1c(5, 6)
+SELECT foo6c(1, 2, 3)
-- !query analysis
-Project [spark_catalog.default.foo2_1c(a#x, b#x) AS spark_catalog.default.foo2_1c(5, 6)#x]
-+- Project [cast(5 as int) AS a#x, cast(6 as int) AS b#x]
+Project [spark_catalog.default.foo6c( a#x, a#x, a b#x) AS spark_catalog.default.foo6c(1, 2, 3)#x]
++- Project [cast(1 as int) AS a#x, cast(2 as int) AS a#x, cast(3 as int) AS a b#x]
+- OneRowRelation
-- !query
-CREATE FUNCTION foo2_1d(a INT, b INT) RETURNS INT RETURN ABS(a) - LENGTH(CAST(b AS VARCHAR(10)))
+CREATE FUNCTION foo6d() RETURNS TABLE(` a` INT, a INT, `a b` INT) RETURN SELECT 1, 2, 3
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_1d`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo6d, ` a` INT, a INT, `a b` INT, SELECT 1, 2, 3, true, false, false, false
-- !query
-SELECT foo2_1d(-5, 6)
+SELECT * FROM foo6d()
-- !query analysis
-Project [spark_catalog.default.foo2_1d(a#x, b#x) AS spark_catalog.default.foo2_1d(-5, 6)#x]
-+- Project [cast(-5 as int) AS a#x, cast(6 as int) AS b#x]
- +- OneRowRelation
+Project [ a#x, a#x, a b#x]
++- SQLFunctionNode spark_catalog.default.foo6d
+ +- SubqueryAlias foo6d
+ +- Project [cast(1#x as int) AS a#x, cast(2#x as int) AS a#x, cast(3#x as int) AS a b#x]
+ +- Project [1 AS 1#x, 2 AS 2#x, 3 AS 3#x]
+ +- OneRowRelation
-- !query
-CREATE FUNCTION foo2_2a(a INT) RETURNS INT RETURN SELECT a
+CREATE FUNCTION foo7a(a STRING, b STRING, c STRING) RETURNS STRING RETURN
+SELECT 'Foo.a: ' || a || ' Foo.a: ' || foo7a.a
+ || ' T.b: ' || b || ' Foo.b: ' || foo7a.b
+ || ' T.c: ' || c || ' T.c: ' || t.c FROM VALUES('t.b', 't.c') AS T(b, c)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_2a`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo7a, a STRING, b STRING, c STRING, STRING, SELECT 'Foo.a: ' || a || ' Foo.a: ' || foo7a.a
+ || ' T.b: ' || b || ' Foo.b: ' || foo7a.b
+ || ' T.c: ' || c || ' T.c: ' || t.c FROM VALUES('t.b', 't.c') AS T(b, c), false, false, false, false
-- !query
-SELECT foo2_2a(5)
+SELECT foo7a('Foo.a', 'Foo.b', 'Foo.c')
-- !query analysis
-Project [spark_catalog.default.foo2_2a(a#x) AS spark_catalog.default.foo2_2a(5)#x]
-+- Project [cast(5 as int) AS a#x]
+Project [spark_catalog.default.foo7a(a#x, b#x, c#x) AS spark_catalog.default.foo7a(Foo.a, Foo.b, Foo.c)#x]
+: +- Project [concat(concat(concat(concat(concat(concat(concat(concat(concat(concat(concat(Foo.a: , outer(a#x)), Foo.a: ), outer(a#x)), T.b: ), b#x), Foo.b: ), outer(b#x)), T.c: ), c#x), T.c: ), c#x) AS concat(concat(concat(concat(concat(concat(concat(concat(concat(concat(concat(Foo.a: , outer(foo7a.a)), Foo.a: ), outer(foo7a.a)), T.b: ), b), Foo.b: ), outer(foo7a.b)), T.c: ), c), T.c: ), c)#x]
+: +- SubqueryAlias T
+: +- LocalRelation [b#x, c#x]
++- Project [cast(Foo.a as string) AS a#x, cast(Foo.b as string) AS b#x, cast(Foo.c as string) AS c#x]
+- OneRowRelation
-- !query
-CREATE FUNCTION foo2_2b(a INT) RETURNS INT RETURN 1 + (SELECT a)
+CREATE FUNCTION foo7at(a STRING, b STRING, c STRING) RETURNS TABLE (a STRING, b STRING, c STRING, d STRING, e STRING) RETURN
+SELECT CONCAT('Foo.a: ', a), CONCAT('Foo.b: ', foo7at.b), CONCAT('T.b: ', b),
+ CONCAT('Foo.c: ', foo7at.c), CONCAT('T.c: ', c)
+FROM VALUES ('t.b', 't.c') AS T(b, c)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_2b`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo7at, a STRING, b STRING, c STRING, a STRING, b STRING, c STRING, d STRING, e STRING, SELECT CONCAT('Foo.a: ', a), CONCAT('Foo.b: ', foo7at.b), CONCAT('T.b: ', b),
+ CONCAT('Foo.c: ', foo7at.c), CONCAT('T.c: ', c)
+FROM VALUES ('t.b', 't.c') AS T(b, c), true, false, false, false
-- !query
-SELECT foo2_2b(5)
+SELECT * FROM foo7at('Foo.a', 'Foo.b', 'Foo.c')
-- !query analysis
-Project [spark_catalog.default.foo2_2b(a#x) AS spark_catalog.default.foo2_2b(5)#x]
-: +- Project [outer(a#x)]
-: +- OneRowRelation
-+- Project [cast(5 as int) AS a#x]
- +- OneRowRelation
+Project [a#x, b#x, c#x, d#x, e#x]
++- SQLFunctionNode spark_catalog.default.foo7at
+ +- SubqueryAlias foo7at
+ +- Project [cast(concat(Foo.a: , outer(foo7at.a))#x as string) AS a#x, cast(concat(Foo.b: , outer(foo7at.b))#x as string) AS b#x, cast(concat(T.b: , b)#x as string) AS c#x, cast(concat(Foo.c: , outer(foo7at.c))#x as string) AS d#x, cast(concat(T.c: , c)#x as string) AS e#x]
+ +- Project [concat(Foo.a: , cast(Foo.a as string)) AS concat(Foo.a: , outer(foo7at.a))#x, concat(Foo.b: , cast(Foo.b as string)) AS concat(Foo.b: , outer(foo7at.b))#x, concat(T.b: , b#x) AS concat(T.b: , b)#x, concat(Foo.c: , cast(Foo.c as string)) AS concat(Foo.c: , outer(foo7at.c))#x, concat(T.c: , c#x) AS concat(T.c: , c)#x]
+ +- SubqueryAlias T
+ +- LocalRelation [b#x, c#x]
-- !query
-CREATE FUNCTION foo2_2c(a INT) RETURNS INT RETURN 1 + (SELECT (SELECT a))
+CREATE FUNCTION foo9a(a BOOLEAN) RETURNS BOOLEAN RETURN NOT a
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "UNRESOLVED_COLUMN.WITHOUT_SUGGESTION",
- "sqlState" : "42703",
- "messageParameters" : {
- "objectName" : "`a`"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 21,
- "stopIndex" : 21,
- "fragment" : "a"
- } ]
-}
+CreateSQLFunctionCommand spark_catalog.default.foo9a, a BOOLEAN, BOOLEAN, NOT a, false, false, false, false
-- !query
-CREATE FUNCTION foo2_2d(a INT) RETURNS INT RETURN 1 + (SELECT (SELECT (SELECT (SELECT a))))
+SELECT foo9a(true)
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "UNRESOLVED_COLUMN.WITHOUT_SUGGESTION",
- "sqlState" : "42703",
- "messageParameters" : {
- "objectName" : "`a`"
- },
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 37,
- "stopIndex" : 37,
- "fragment" : "a"
- } ]
-}
+Project [spark_catalog.default.foo9a(a#x) AS spark_catalog.default.foo9a(true)#x]
++- Project [cast(true as boolean) AS a#x]
+ +- OneRowRelation
-- !query
-CREATE FUNCTION foo2_2e(a INT) RETURNS INT RETURN
-SELECT a FROM (VALUES 1) AS V(c1) WHERE c1 = 2
-UNION ALL
-SELECT a + 1 FROM (VALUES 1) AS V(c1)
+SELECT foo9a(5)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_2e`"
- }
-}
+Project [spark_catalog.default.foo9a(a#x) AS spark_catalog.default.foo9a(5)#x]
++- Project [cast(5 as boolean) AS a#x]
+ +- OneRowRelation
-- !query
-CREATE FUNCTION foo2_2f(a INT) RETURNS INT RETURN
-SELECT a FROM (VALUES 1) AS V(c1)
-EXCEPT
-SELECT a + 1 FROM (VALUES 1) AS V(a)
+SELECT foo9a('Nonsense')
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_2f`"
- }
-}
+Project [spark_catalog.default.foo9a(a#x) AS spark_catalog.default.foo9a(Nonsense)#x]
++- Project [cast(Nonsense as boolean) AS a#x]
+ +- OneRowRelation
-- !query
-CREATE FUNCTION foo2_2g(a INT) RETURNS INT RETURN
-SELECT a FROM (VALUES 1) AS V(c1)
-INTERSECT
-SELECT a FROM (VALUES 1) AS V(a)
+CREATE FUNCTION foo9b(a BYTE) RETURNS BYTE RETURN CAST(a AS SHORT) + 1
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_2g`"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo9b, a BYTE, BYTE, CAST(a AS SHORT) + 1, false, false, false, false
-- !query
-DROP TABLE IF EXISTS t1
+SELECT foo9b(126)
-- !query analysis
-DropTable true, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
+Project [spark_catalog.default.foo9b(a#x) AS spark_catalog.default.foo9b(126)#x]
++- Project [cast(126 as tinyint) AS a#x]
+ +- OneRowRelation
-- !query
-DROP TABLE IF EXISTS t2
+SELECT foo9b(127)
-- !query analysis
-DropTable true, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t2
+Project [spark_catalog.default.foo9b(a#x) AS spark_catalog.default.foo9b(127)#x]
++- Project [cast(127 as tinyint) AS a#x]
+ +- OneRowRelation
-- !query
-DROP TABLE IF EXISTS ts
+SELECT foo9b(128)
-- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "WRONG_COMMAND_FOR_OBJECT_TYPE",
- "sqlState" : "42809",
- "messageParameters" : {
- "alternative" : "DROP VIEW",
- "foundType" : "VIEW",
- "objectName" : "spark_catalog.default.ts",
- "operation" : "DROP TABLE",
- "requiredType" : "EXTERNAL or MANAGED"
- }
-}
+Project [spark_catalog.default.foo9b(a#x) AS spark_catalog.default.foo9b(128)#x]
++- Project [cast(128 as tinyint) AS a#x]
+ +- OneRowRelation
-- !query
-DROP TABLE IF EXISTS tm
+CREATE FUNCTION foo9c(a SHORT) RETURNS SHORT RETURN CAST(a AS INTEGER) + 1
-- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "WRONG_COMMAND_FOR_OBJECT_TYPE",
- "sqlState" : "42809",
- "messageParameters" : {
- "alternative" : "DROP VIEW",
- "foundType" : "VIEW",
- "objectName" : "spark_catalog.default.tm",
- "operation" : "DROP TABLE",
- "requiredType" : "EXTERNAL or MANAGED"
- }
-}
+CreateSQLFunctionCommand spark_catalog.default.foo9c, a SHORT, SHORT, CAST(a AS INTEGER) + 1, false, false, false, false
-- !query
-DROP TABLE IF EXISTS ta
+SELECT foo9c(32766)
-- !query analysis
-org.apache.spark.sql.AnalysisException
-{
- "errorClass" : "WRONG_COMMAND_FOR_OBJECT_TYPE",
- "sqlState" : "42809",
- "messageParameters" : {
- "alternative" : "DROP VIEW",
- "foundType" : "VIEW",
- "objectName" : "spark_catalog.default.ta",
- "operation" : "DROP TABLE",
- "requiredType" : "EXTERNAL or MANAGED"
- }
-}
+Project [spark_catalog.default.foo9c(a#x) AS spark_catalog.default.foo9c(32766)#x]
++- Project [cast(32766 as smallint) AS a#x]
+ +- OneRowRelation
-- !query
-DROP TABLE IF EXISTS V1
+SELECT foo9c(32767)
-- !query analysis
-DropTable true, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.V1
+Project [spark_catalog.default.foo9c(a#x) AS spark_catalog.default.foo9c(32767)#x]
++- Project [cast(32767 as smallint) AS a#x]
+ +- OneRowRelation
-- !query
-DROP TABLE IF EXISTS V2
+SELECT foo9c(32768)
-- !query analysis
-DropTable true, false
-+- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.V2
+Project [spark_catalog.default.foo9c(a#x) AS spark_catalog.default.foo9c(32768)#x]
++- Project [cast(32768 as smallint) AS a#x]
+ +- OneRowRelation
-- !query
-DROP VIEW IF EXISTS t1
+CREATE FUNCTION foo9d(a INTEGER) RETURNS INTEGER RETURN CAST(a AS BIGINT) + 1
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`t1`, true, true, false
+CreateSQLFunctionCommand spark_catalog.default.foo9d, a INTEGER, INTEGER, CAST(a AS BIGINT) + 1, false, false, false, false
-- !query
-DROP VIEW IF EXISTS t2
+SELECT foo9d(2147483647 - 1)
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`t2`, true, true, false
+Project [spark_catalog.default.foo9d(a#x) AS spark_catalog.default.foo9d((2147483647 - 1))#x]
++- Project [cast((2147483647 - 1) as int) AS a#x]
+ +- OneRowRelation
-- !query
-DROP VIEW IF EXISTS ts
+SELECT foo9d(2147483647)
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`ts`, true, true, false
+Project [spark_catalog.default.foo9d(a#x) AS spark_catalog.default.foo9d(2147483647)#x]
++- Project [cast(2147483647 as int) AS a#x]
+ +- OneRowRelation
-- !query
-DROP VIEW IF EXISTS tm
+SELECT foo9d(2147483647 + 1)
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`tm`, true, true, false
+Project [spark_catalog.default.foo9d(a#x) AS spark_catalog.default.foo9d((2147483647 + 1))#x]
++- Project [cast((2147483647 + 1) as int) AS a#x]
+ +- OneRowRelation
-- !query
-DROP VIEW IF EXISTS ta
+CREATE FUNCTION foo9e(a BIGINT) RETURNS BIGINT RETURN CAST(a AS DECIMAL(20, 0)) + 1
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`ta`, true, true, false
+CreateSQLFunctionCommand spark_catalog.default.foo9e, a BIGINT, BIGINT, CAST(a AS DECIMAL(20, 0)) + 1, false, false, false, false
-- !query
-DROP VIEW IF EXISTS V1
+SELECT foo9e(9223372036854775807 - 1)
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`V1`, true, true, false
+Project [spark_catalog.default.foo9e(a#xL) AS spark_catalog.default.foo9e((9223372036854775807 - 1))#xL]
++- Project [cast((9223372036854775807 - cast(1 as bigint)) as bigint) AS a#xL]
+ +- OneRowRelation
-- !query
-DROP VIEW IF EXISTS V2
+SELECT foo9e(9223372036854775807)
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`V2`, true, true, false
+Project [spark_catalog.default.foo9e(a#xL) AS spark_catalog.default.foo9e(9223372036854775807)#xL]
++- Project [cast(9223372036854775807 as bigint) AS a#xL]
+ +- OneRowRelation
-- !query
-CREATE FUNCTION foo2_3(a INT, b INT) RETURNS INT RETURN a + b
+SELECT foo9e(9223372036854775807.0 + 1)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_3`"
- }
-}
+Project [spark_catalog.default.foo9e(a#xL) AS spark_catalog.default.foo9e((9223372036854775807.0 + 1))#xL]
++- Project [cast((9223372036854775807.0 + cast(1 as decimal(1,0))) as bigint) AS a#xL]
+ +- OneRowRelation
-- !query
-CREATE VIEW V1(c1, c2) AS VALUES (1, 2), (3, 4), (5, 6)
+CREATE FUNCTION foo9f(a DECIMAL( 5, 2 )) RETURNS DECIMAL (5, 2) RETURN CAST(a AS DECIMAL(6, 2)) + 1
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`V1`, [(c1,None), (c2,None)], VALUES (1, 2), (3, 4), (5, 6), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9f, a DECIMAL( 5, 2 ), DECIMAL (5, 2), CAST(a AS DECIMAL(6, 2)) + 1, false, false, false, false
-- !query
-CREATE VIEW V2(c1, c2) AS VALUES (-1, -2), (-3, -4), (-5, -6)
+SELECT foo9f(999 - 1)
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`V2`, [(c1,None), (c2,None)], VALUES (-1, -2), (-3, -4), (-5, -6), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9f(a#x) AS spark_catalog.default.foo9f((999 - 1))#x]
++- Project [cast((999 - 1) as decimal(5,2)) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo2_3(c1, c2), foo2_3(c2, 1), foo2_3(c1, c2) - foo2_3(c2, c1 - 1) FROM V1 ORDER BY 1, 2, 3
+SELECT foo9f(999)
-- !query analysis
-Sort [spark_catalog.default.foo2_3(c1, c2)#x ASC NULLS FIRST, spark_catalog.default.foo2_3(c2, 1)#x ASC NULLS FIRST, (spark_catalog.default.foo2_3(c1, c2) - spark_catalog.default.foo2_3(c2, (c1 - 1)))#x ASC NULLS FIRST], true
-+- Project [spark_catalog.default.foo2_3(a#x, b#x) AS spark_catalog.default.foo2_3(c1, c2)#x, spark_catalog.default.foo2_3(a#x, b#x) AS spark_catalog.default.foo2_3(c2, 1)#x, (spark_catalog.default.foo2_3(a#x, b#x) - spark_catalog.default.foo2_3(a#x, b#x)) AS (spark_catalog.default.foo2_3(c1, c2) - spark_catalog.default.foo2_3(c2, (c1 - 1)))#x]
- +- Project [c1#x, c2#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x, cast(c2#x as int) AS a#x, cast(1 as int) AS b#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x, cast(c2#x as int) AS a#x, cast((c1#x - 1) as int) AS b#x]
- +- SubqueryAlias spark_catalog.default.v1
- +- View (`spark_catalog`.`default`.`v1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9f(a#x) AS spark_catalog.default.foo9f(999)#x]
++- Project [cast(999 as decimal(5,2)) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT * FROM V1 WHERE foo2_3(c1, 0) = c1 AND foo2_3(c1, c2) < 8
+SELECT foo9f(999 + 1)
-- !query analysis
-Project [c1#x, c2#x]
-+- Project [c1#x, c2#x]
- +- Filter ((spark_catalog.default.foo2_3(a#x, b#x) = c1#x) AND (spark_catalog.default.foo2_3(a#x, b#x) < 8))
- +- Project [c1#x, c2#x, cast(c1#x as int) AS a#x, cast(0 as int) AS b#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x]
- +- SubqueryAlias spark_catalog.default.v1
- +- View (`spark_catalog`.`default`.`v1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9f(a#x) AS spark_catalog.default.foo9f((999 + 1))#x]
++- Project [cast((999 + 1) as decimal(5,2)) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo2_3(SUM(c1), SUM(c2)), SUM(c1) + SUM(c2), SUM(foo2_3(c1, c2) + foo2_3(c2, c1) - foo2_3(c2, c1))
-FROM V1
+CREATE FUNCTION foo9g(a FLOAT, b String) RETURNS FLOAT RETURN b || CAST(a AS String)
-- !query analysis
-Project [spark_catalog.default.foo2_3(a#x, b#x) AS spark_catalog.default.foo2_3(sum(c1), sum(c2))#x, (sum(c1) + sum(c2))#xL, sum(((spark_catalog.default.foo2_3(c1, c2) + spark_catalog.default.foo2_3(c2, c1)) - spark_catalog.default.foo2_3(c2, c1)))#xL]
-+- Project [sum(c1)#xL, sum(c2)#xL, (sum(c1) + sum(c2))#xL, sum(((spark_catalog.default.foo2_3(c1, c2) + spark_catalog.default.foo2_3(c2, c1)) - spark_catalog.default.foo2_3(c2, c1)))#xL, cast(sum(c1)#xL as int) AS a#x, cast(sum(c2)#xL as int) AS b#x]
- +- Aggregate [sum(c1#x) AS sum(c1)#xL, sum(c2#x) AS sum(c2)#xL, (sum(c1#x) + sum(c2#x)) AS (sum(c1) + sum(c2))#xL, sum(((spark_catalog.default.foo2_3(a#x, b#x) + spark_catalog.default.foo2_3(a#x, b#x)) - spark_catalog.default.foo2_3(a#x, b#x))) AS sum(((spark_catalog.default.foo2_3(c1, c2) + spark_catalog.default.foo2_3(c2, c1)) - spark_catalog.default.foo2_3(c2, c1)))#xL]
- +- Project [c1#x, c2#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x, cast(c2#x as int) AS a#x, cast(c1#x as int) AS b#x, cast(c2#x as int) AS a#x, cast(c1#x as int) AS b#x]
- +- SubqueryAlias spark_catalog.default.v1
- +- View (`spark_catalog`.`default`.`v1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9g, a FLOAT, b String, FLOAT, b || CAST(a AS String), false, false, false, false
-- !query
-CREATE FUNCTION foo2_4a(a ARRAY) RETURNS STRING RETURN
-SELECT array_sort(a, (i, j) -> rank[i] - rank[j])[0] FROM (SELECT MAP('a', 1, 'b', 2) rank)
+SELECT foo9g(123.23, '7')
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_4a`"
- }
-}
+Project [spark_catalog.default.foo9g(a#x, b#x) AS spark_catalog.default.foo9g(123.23, 7)#x]
++- Project [cast(123.23 as float) AS a#x, cast(7 as string) AS b#x]
+ +- OneRowRelation
-- !query
-SELECT foo2_4a(ARRAY('a', 'b'))
+SELECT foo9g('hello', '7')
-- !query analysis
-Project [spark_catalog.default.foo2_4a(a#x) AS spark_catalog.default.foo2_4a(array(a, b))#x]
-: +- Project [array_sort(outer(a#x), lambdafunction((rank#x[lambda i#x] - rank#x[lambda j#x]), lambda i#x, lambda j#x, false), false)[0] AS array_sort(outer(foo2_4a.a), lambdafunction((rank[namedlambdavariable()] - rank[namedlambdavariable()]), namedlambdavariable(), namedlambdavariable()))[0]#x]
-: +- SubqueryAlias __auto_generated_subquery_name
-: +- Project [map(a, 1, b, 2) AS rank#x]
-: +- OneRowRelation
-+- Project [cast(array(a, b) as array) AS a#x]
+Project [spark_catalog.default.foo9g(a#x, b#x) AS spark_catalog.default.foo9g(hello, 7)#x]
++- Project [cast(hello as float) AS a#x, cast(7 as string) AS b#x]
+- OneRowRelation
-- !query
-CREATE FUNCTION foo2_4b(m MAP, k STRING) RETURNS STRING RETURN
-SELECT v || ' ' || v FROM (SELECT upper(m[k]) AS v)
+SELECT foo9g(123.23, 'q')
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
-{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
- "messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo2_4b`"
- }
-}
+Project [spark_catalog.default.foo9g(a#x, b#x) AS spark_catalog.default.foo9g(123.23, q)#x]
++- Project [cast(123.23 as float) AS a#x, cast(q as string) AS b#x]
+ +- OneRowRelation
-- !query
-SELECT foo2_4b(map('a', 'hello', 'b', 'world'), 'a')
+CREATE FUNCTION foo9h(a DOUBLE, b String) RETURNS DOUBLE RETURN b || CAST(a AS String)
-- !query analysis
-Project [spark_catalog.default.foo2_4b(m#x, k#x) AS spark_catalog.default.foo2_4b(map(a, hello, b, world), a)#x]
-: +- Project [concat(concat(v#x, ), v#x) AS concat(concat(v, ), v)#x]
-: +- SubqueryAlias __auto_generated_subquery_name
-: +- Project [upper(outer(m#x)[outer(k#x)]) AS v#x]
-: +- OneRowRelation
-+- Project [cast(map(a, hello, b, world) as map) AS m#x, cast(a as string) AS k#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9h, a DOUBLE, b String, DOUBLE, b || CAST(a AS String), false, false, false, false
+
+
+-- !query
+SELECT foo9h(123.23, '7')
+-- !query analysis
+Project [spark_catalog.default.foo9h(a#x, b#x) AS spark_catalog.default.foo9h(123.23, 7)#x]
++- Project [cast(123.23 as double) AS a#x, cast(7 as string) AS b#x]
+- OneRowRelation
-- !query
-DROP VIEW V2
+SELECT foo9h('hello', '7')
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`V2`, false, true, false
+Project [spark_catalog.default.foo9h(a#x, b#x) AS spark_catalog.default.foo9h(hello, 7)#x]
++- Project [cast(hello as double) AS a#x, cast(7 as string) AS b#x]
+ +- OneRowRelation
-- !query
-DROP VIEW V1
+SELECT foo9h(123.23, 'q')
-- !query analysis
-DropTableCommand `spark_catalog`.`default`.`V1`, false, true, false
+Project [spark_catalog.default.foo9h(a#x, b#x) AS spark_catalog.default.foo9h(123.23, q)#x]
++- Project [cast(123.23 as double) AS a#x, cast(q as string) AS b#x]
+ +- OneRowRelation
-- !query
-CREATE VIEW t1(c1, c2) AS VALUES (0, 1), (0, 2), (1, 2)
+CREATE FUNCTION foo9i(a VARCHAR(10), b VARCHAR(10)) RETURNS VARCHAR(12) RETURN a || b
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`t1`, [(c1,None), (c2,None)], VALUES (0, 1), (0, 2), (1, 2), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x, col2#x]
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "UNSUPPORTED_CHAR_OR_VARCHAR_AS_STRING",
+ "sqlState" : "0A000"
+}
-- !query
-CREATE VIEW t2(c1, c2) AS VALUES (0, 2), (0, 3)
+CREATE FUNCTION foo9j(a STRING, b STRING) RETURNS STRING RETURN a || b
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`t2`, [(c1,None), (c2,None)], VALUES (0, 2), (0, 3), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9j, a STRING, b STRING, STRING, a || b, false, false, false, false
-- !query
-CREATE VIEW ts(x) AS VALUES NAMED_STRUCT('a', 1, 'b', 2)
+SELECT foo9j('1234567890', '12')
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`ts`, [(x,None)], VALUES NAMED_STRUCT('a', 1, 'b', 2), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x]
+Project [spark_catalog.default.foo9j(a#x, b#x) AS spark_catalog.default.foo9j(1234567890, 12)#x]
++- Project [cast(1234567890 as string) AS a#x, cast(12 as string) AS b#x]
+ +- OneRowRelation
-- !query
-CREATE VIEW tm(x) AS VALUES MAP('a', 1, 'b', 2)
+SELECT foo9j(12345678901, '12')
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`tm`, [(x,None)], VALUES MAP('a', 1, 'b', 2), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x]
+Project [spark_catalog.default.foo9j(a#x, b#x) AS spark_catalog.default.foo9j(12345678901, 12)#x]
++- Project [cast(12345678901 as string) AS a#x, cast(12 as string) AS b#x]
+ +- OneRowRelation
-- !query
-CREATE VIEW ta(x) AS VALUES ARRAY(1, 2, 3)
+CREATE FUNCTION foo9l(a DATE, b INTERVAL) RETURNS DATE RETURN a + b
-- !query analysis
-CreateViewCommand `spark_catalog`.`default`.`ta`, [(x,None)], VALUES ARRAY(1, 2, 3), false, false, PersistedView, COMPENSATION, true
- +- LocalRelation [col1#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9l, a DATE, b INTERVAL, DATE, a + b, false, false, false, false
-- !query
-CREATE FUNCTION foo3_1a(a DOUBLE, b DOUBLE) RETURNS DOUBLE RETURN a * b
+SELECT foo9l(DATE '2020-02-02', INTERVAL '1' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "DATATYPE_MISMATCH.CAST_WITHOUT_SUGGESTION",
+ "sqlState" : "42K09",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1a`"
- }
+ "sqlExpr" : "\"INTERVAL '1' YEAR\"",
+ "srcType" : "\"INTERVAL YEAR\"",
+ "targetType" : "\"INTERVAL\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 50,
+ "fragment" : "foo9l(DATE '2020-02-02', INTERVAL '1' YEAR)"
+ } ]
}
-- !query
-CREATE FUNCTION foo3_1b(x INT) RETURNS INT RETURN x
+SELECT foo9l('2020-02-02', INTERVAL '1' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "DATATYPE_MISMATCH.CAST_WITHOUT_SUGGESTION",
+ "sqlState" : "42K09",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1b`"
- }
+ "sqlExpr" : "\"INTERVAL '1' YEAR\"",
+ "srcType" : "\"INTERVAL YEAR\"",
+ "targetType" : "\"INTERVAL\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 45,
+ "fragment" : "foo9l('2020-02-02', INTERVAL '1' YEAR)"
+ } ]
}
-- !query
-CREATE FUNCTION foo3_1c(x INT) RETURNS INT RETURN SELECT x
+SELECT foo9l(DATE '-7', INTERVAL '1' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.parser.ParseException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "INVALID_TYPED_LITERAL",
+ "sqlState" : "42604",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1c`"
- }
+ "value" : "'-7'",
+ "valueType" : "\"DATE\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 14,
+ "stopIndex" : 22,
+ "fragment" : "DATE '-7'"
+ } ]
}
-- !query
-CREATE FUNCTION foo3_1d(x INT) RETURNS INT RETURN (SELECT SUM(c2) FROM t2 WHERE c1 = x)
+SELECT foo9l(DATE '2020-02-02', INTERVAL '9999999' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "DATATYPE_MISMATCH.CAST_WITHOUT_SUGGESTION",
+ "sqlState" : "42K09",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1d`"
- }
+ "sqlExpr" : "\"INTERVAL '9999999' YEAR\"",
+ "srcType" : "\"INTERVAL YEAR\"",
+ "targetType" : "\"INTERVAL\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 56,
+ "fragment" : "foo9l(DATE '2020-02-02', INTERVAL '9999999' YEAR)"
+ } ]
}
-- !query
-CREATE FUNCTION foo3_1e() RETURNS INT RETURN foo3_1d(0)
+CREATE FUNCTION foo9m(a TIMESTAMP, b INTERVAL) RETURNS TIMESTAMP RETURN a + b
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo9m, a TIMESTAMP, b INTERVAL, TIMESTAMP, a + b, false, false, false, false
+
+
+-- !query
+SELECT foo9m(TIMESTAMP'2020-02-02 12:15:16.123', INTERVAL '1' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "DATATYPE_MISMATCH.CAST_WITHOUT_SUGGESTION",
+ "sqlState" : "42K09",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1e`"
- }
+ "sqlExpr" : "\"INTERVAL '1' YEAR\"",
+ "srcType" : "\"INTERVAL YEAR\"",
+ "targetType" : "\"INTERVAL\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 67,
+ "fragment" : "foo9m(TIMESTAMP'2020-02-02 12:15:16.123', INTERVAL '1' YEAR)"
+ } ]
}
-- !query
-CREATE FUNCTION foo3_1f() RETURNS INT RETURN SELECT SUM(c2) FROM t2 WHERE c1 = 0
+SELECT foo9m('2020-02-02 12:15:16.123', INTERVAL '1' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "DATATYPE_MISMATCH.CAST_WITHOUT_SUGGESTION",
+ "sqlState" : "42K09",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1f`"
- }
+ "sqlExpr" : "\"INTERVAL '1' YEAR\"",
+ "srcType" : "\"INTERVAL YEAR\"",
+ "targetType" : "\"INTERVAL\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 58,
+ "fragment" : "foo9m('2020-02-02 12:15:16.123', INTERVAL '1' YEAR)"
+ } ]
}
-- !query
-CREATE FUNCTION foo3_1g(x INT) RETURNS INT RETURN SELECT (SELECT x)
+SELECT foo9m(TIMESTAMP'2020-02-02 12:15:16.123', INTERVAL '999999' YEAR)
-- !query analysis
-org.apache.spark.sql.catalyst.analysis.FunctionAlreadyExistsException
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "ROUTINE_ALREADY_EXISTS",
- "sqlState" : "42723",
+ "errorClass" : "DATATYPE_MISMATCH.CAST_WITHOUT_SUGGESTION",
+ "sqlState" : "42K09",
"messageParameters" : {
- "existingRoutineType" : "routine",
- "newRoutineType" : "routine",
- "routineName" : "`default`.`foo3_1g`"
- }
+ "sqlExpr" : "\"INTERVAL '999999' YEAR\"",
+ "srcType" : "\"INTERVAL YEAR\"",
+ "targetType" : "\"INTERVAL\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 8,
+ "stopIndex" : 72,
+ "fragment" : "foo9m(TIMESTAMP'2020-02-02 12:15:16.123', INTERVAL '999999' YEAR)"
+ } ]
}
-- !query
-SELECT a, b, foo3_1a(a + 1, b + 1) FROM t1 AS t(a, b)
+CREATE FUNCTION foo9n(a ARRAY<INT>) RETURNS ARRAY<INT> RETURN a
-- !query analysis
-Project [a#x, b#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a((a + 1), (b + 1))#x]
-+- Project [a#x, b#x, cast((a#x + 1) as double) AS a#x, cast((b#x + 1) as double) AS b#x]
- +- SubqueryAlias t
- +- Project [c1#x AS a#x, c2#x AS b#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9n, a ARRAY<INT>, ARRAY<INT>, a, false, false, false, false
-- !query
-SELECT x, foo3_1c(x) FROM t1 AS t(x, y)
+SELECT foo9n(ARRAY(1, 2, 3))
-- !query analysis
-Project [x#x, spark_catalog.default.foo3_1c(x#x) AS spark_catalog.default.foo3_1c(x)#x]
-+- Project [x#x, y#x, cast(x#x as int) AS x#x]
- +- SubqueryAlias t
- +- Project [c1#x AS x#x, c2#x AS y#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9n(a#x) AS spark_catalog.default.foo9n(array(1, 2, 3))#x]
++- Project [cast(array(1, 2, 3) as array<int>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT c1, foo3_1d(c1) FROM t1
+SELECT foo9n(from_json('[1, 2, 3]', 'array<int>'))
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1d(x#x) AS spark_catalog.default.foo3_1d(c1)#x]
-: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
-: +- Filter (c1#x = outer(x#x))
-: +- SubqueryAlias spark_catalog.default.t2
-: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
-: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
-: +- LocalRelation [col1#x, col2#x]
-+- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9n(a#x) AS spark_catalog.default.foo9n(from_json([1, 2, 3]))#x]
++- Project [cast(from_json(ArrayType(IntegerType,true), [1, 2, 3], Some(America/Los_Angeles), false) as array<int>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT c1, foo3_1a(foo3_1b(c1), foo3_1b(c1)) FROM t1
+CREATE FUNCTION foo9o(a MAP<STRING, INT>) RETURNS MAP<STRING, INT> RETURN a
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(spark_catalog.default.foo3_1b(c1), spark_catalog.default.foo3_1b(c1))#x]
-+- Project [c1#x, c2#x, x#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as double) AS a#x, cast(spark_catalog.default.foo3_1b(x#x) as double) AS b#x]
- +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x, cast(c1#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9o, a MAP<STRING, INT>, MAP<STRING, INT>, a, false, false, false, false
-- !query
-SELECT c1, foo3_1d(foo3_1c(foo3_1b(c1))) FROM t1
+SELECT foo9o(MAP('hello', 1, 'world', 2))
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1d(x#x) AS spark_catalog.default.foo3_1d(spark_catalog.default.foo3_1c(spark_catalog.default.foo3_1b(c1)))#x]
-: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
-: +- Filter (c1#x = outer(x#x))
-: +- SubqueryAlias spark_catalog.default.t2
-: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
-: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
-: +- LocalRelation [col1#x, col2#x]
-+- Project [c1#x, c2#x, x#x, x#x, cast(spark_catalog.default.foo3_1c(x#x) as int) AS x#x]
- +- Project [c1#x, c2#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x]
- +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9o(a#x) AS spark_catalog.default.foo9o(map(hello, 1, world, 2))#x]
++- Project [cast(map(hello, 1, world, 2) as map<string,int>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT c1, foo3_1a(foo3_1c(foo3_1b(c1)), foo3_1d(foo3_1b(c1))) FROM t1
+SELECT foo9o(from_json('{"hello":1, "world":2}', 'map<string, int>'))
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(spark_catalog.default.foo3_1c(spark_catalog.default.foo3_1b(c1)), spark_catalog.default.foo3_1d(spark_catalog.default.foo3_1b(c1)))#x]
-+- Project [c1#x, c2#x, x#x, x#x, x#x, x#x, cast(spark_catalog.default.foo3_1c(x#x) as double) AS a#x, cast(spark_catalog.default.foo3_1d(x#x) as double) AS b#x]
- : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
- : +- Filter (c1#x = outer(x#x))
- : +- SubqueryAlias spark_catalog.default.t2
- : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
- : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- : +- LocalRelation [col1#x, col2#x]
- +- Project [c1#x, c2#x, x#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x]
- +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x, cast(c1#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9o(a#x) AS spark_catalog.default.foo9o(entries)#x]
++- Project [cast(from_json(MapType(StringType,IntegerType,true), {"hello":1, "world":2}, Some(America/Los_Angeles), false) as map<string,int>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1c(foo3_1e()) FROM t1
+CREATE FUNCTION foo9p(a STRUCT<a1: INT, a2: STRING>) RETURNS STRUCT<a1: INT, a2: STRING> RETURN a
-- !query analysis
-Project [spark_catalog.default.foo3_1c(x#x) AS spark_catalog.default.foo3_1c(spark_catalog.default.foo3_1e())#x]
-+- Project [c1#x, c2#x, x#x, cast(spark_catalog.default.foo3_1e() as int) AS x#x]
- : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
- : +- Filter (c1#x = outer(x#x))
- : +- SubqueryAlias spark_catalog.default.t2
- : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
- : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- : +- LocalRelation [col1#x, col2#x]
- +- Project [c1#x, c2#x, cast(0 as int) AS x#x]
- +- Project [c1#x, c2#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9p, a STRUCT<a1: INT, a2: STRING>, STRUCT<a1: INT, a2: STRING>, a, false, false, false, false
-- !query
-SELECT foo3_1a(MAX(c1), MAX(c2)) FROM t1
+SELECT foo9p(STRUCT(1, 'hello'))
-- !query analysis
-Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(max(c1), max(c2))#x]
-+- Project [max(c1)#x, max(c2)#x, cast(max(c1)#x as double) AS a#x, cast(max(c2)#x as double) AS b#x]
- +- Aggregate [max(c1#x) AS max(c1)#x, max(c2#x) AS max(c2)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9p(a#x) AS spark_catalog.default.foo9p(struct(1, hello))#x]
++- Project [cast(struct(col1, 1, col2, hello) as struct<a1:int,a2:string>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1a(MAX(c1), c2) FROM t1 GROUP BY c2
+SELECT foo9p(from_json('{1:"hello"}', 'struct<a1: INT, a2: STRING>'))
-- !query analysis
-Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(max(c1), c2)#x]
-+- Project [max(c1)#x, c2#x, cast(max(c1)#x as double) AS a#x, cast(c2#x as double) AS b#x]
- +- Aggregate [c2#x], [max(c1#x) AS max(c1)#x, c2#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9p(a#x) AS spark_catalog.default.foo9p(from_json({1:"hello"}))#x]
++- Project [cast(from_json(StructField(a1,IntegerType,true), StructField(a2,StringType,true), {1:"hello"}, Some(America/Los_Angeles), false) as struct<a1:int,a2:string>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1a(c1, c2) FROM t1 GROUP BY c1, c2
+CREATE FUNCTION foo9q(a ARRAY<STRUCT<a1: INT, a2: STRING>>) RETURNS ARRAY<STRUCT<a1: INT, a2: STRING>> RETURN a
-- !query analysis
-Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, c2)#x]
-+- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
- +- Aggregate [c1#x, c2#x], [c1#x, c2#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9q, a ARRAY<STRUCT<a1: INT, a2: STRING>>, ARRAY<STRUCT<a1: INT, a2: STRING>>, a, false, false, false, false
-- !query
-SELECT MAX(foo3_1a(c1, c2)) FROM t1 GROUP BY c1, c2
+SELECT foo9q(ARRAY(STRUCT(1, 'hello'), STRUCT(2, 'world')))
-- !query analysis
-Project [max(spark_catalog.default.foo3_1a(c1, c2))#x]
-+- Aggregate [c1#x, c2#x], [max(spark_catalog.default.foo3_1a(a#x, b#x)) AS max(spark_catalog.default.foo3_1a(c1, c2))#x]
- +- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9q(a#x) AS spark_catalog.default.foo9q(array(struct(1, hello), struct(2, world)))#x]
++- Project [cast(array(struct(col1, 1, col2, hello), struct(col1, 2, col2, world)) as array<struct<a1:int,a2:string>>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT MAX(c1) + foo3_1b(MAX(c1)) FROM t1 GROUP BY c2
+SELECT foo9q(ARRAY(NAMED_STRUCT('x', 1, 'y', 'hello'), NAMED_STRUCT('x', 2, 'y', 'world')))
-- !query analysis
-Project [(max(c1)#x + spark_catalog.default.foo3_1b(x#x)) AS (max(c1) + spark_catalog.default.foo3_1b(max(c1)))#x]
-+- Project [max(c1)#x, max(c1)#x, cast(max(c1)#x as int) AS x#x]
- +- Aggregate [c2#x], [max(c1#x) AS max(c1)#x, max(c1#x) AS max(c1)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9q(a#x) AS spark_catalog.default.foo9q(array(named_struct(x, 1, y, hello), named_struct(x, 2, y, world)))#x]
++- Project [cast(array(named_struct(x, 1, y, hello), named_struct(x, 2, y, world)) as array<struct<a1:int,a2:string>>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT c1, SUM(foo3_1c(c2)) FROM t1 GROUP BY c1
+SELECT foo9q(from_json('[{1:"hello"}, {2:"world"}]', 'array<struct<a1: INT, a2: STRING>>'))
-- !query analysis
-Project [c1#x, sum(spark_catalog.default.foo3_1c(c2))#xL]
-+- Aggregate [c1#x], [c1#x, sum(spark_catalog.default.foo3_1c(x#x)) AS sum(spark_catalog.default.foo3_1c(c2))#xL]
- +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9q(a#x) AS spark_catalog.default.foo9q(from_json([{1:"hello"}, {2:"world"}]))#x]
++- Project [cast(from_json(ArrayType(StructType(StructField(a1,IntegerType,true),StructField(a2,StringType,true)),true), [{1:"hello"}, {2:"world"}], Some(America/Los_Angeles), false) as array<struct<a1:int,a2:string>>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT c1, SUM(foo3_1d(c2)) FROM t1 GROUP BY c1
+CREATE FUNCTION foo9r(a ARRAY<MAP<STRING, INT>>) RETURNS ARRAY<MAP<STRING, INT>> RETURN a
-- !query analysis
-Project [c1#x, sum(spark_catalog.default.foo3_1d(c2))#xL]
-+- Aggregate [c1#x], [c1#x, sum(spark_catalog.default.foo3_1d(x#x)) AS sum(spark_catalog.default.foo3_1d(c2))#xL]
- : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
- : +- Filter (c1#x = outer(x#x))
- : +- SubqueryAlias spark_catalog.default.t2
- : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
- : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- : +- LocalRelation [col1#x, col2#x]
- +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo9r, a ARRAY<MAP<STRING, INT>>, ARRAY<MAP<STRING, INT>>, a, false, false, false, false
-- !query
-SELECT foo3_1c(c1), foo3_1d(c1) FROM t1 GROUP BY c1
+SELECT foo9r(ARRAY(MAP('hello', 1), MAP('world', 2)))
-- !query analysis
-Project [spark_catalog.default.foo3_1c(x#x) AS spark_catalog.default.foo3_1c(c1)#x, spark_catalog.default.foo3_1d(x#x) AS spark_catalog.default.foo3_1d(c1)#x]
-: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
-: +- Filter (c1#x = outer(x#x))
-: +- SubqueryAlias spark_catalog.default.t2
-: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
-: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
-: +- LocalRelation [col1#x, col2#x]
-+- Project [c1#x, c1#x, cast(c1#x as int) AS x#x, cast(c1#x as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, c1#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo9r(a#x) AS spark_catalog.default.foo9r(array(map(hello, 1), map(world, 2)))#x]
++- Project [cast(array(map(hello, 1), map(world, 2)) as array<map<string,int>>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1a(SUM(c1), rand(0) * 0) FROM t1
+SELECT foo9r(from_json('[{"hello":1}, {"world":2}]', 'array<map<string, int>>'))
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+Project [spark_catalog.default.foo9r(a#x) AS spark_catalog.default.foo9r(from_json([{"hello":1}, {"world":2}]))#x]
++- Project [cast(from_json(ArrayType(MapType(StringType,IntegerType,true),true), [{"hello":1}, {"world":2}], Some(America/Los_Angeles), false) as array<map<string,int>>) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1a(SUM(c1) + rand(0) * 0, SUM(c2)) FROM t1
+CREATE OR REPLACE FUNCTION foo1_10(a INT) RETURNS INT RETURN a + 2
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+CreateSQLFunctionCommand spark_catalog.default.foo1_10, a INT, INT, a + 2, false, false, false, true
-- !query
-SELECT foo3_1b(SUM(c1) + rand(0) * 0) FROM t1
+CREATE OR REPLACE FUNCTION bar1_10(b INT) RETURNS STRING RETURN foo1_10(TRY_CAST(b AS STRING))
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+CreateSQLFunctionCommand spark_catalog.default.bar1_10, b INT, STRING, foo1_10(TRY_CAST(b AS STRING)), false, false, false, true
-- !query
-SELECT foo3_1b(SUM(1) + rand(0) * 0) FROM t1 GROUP BY c2
+SELECT bar1_10(3)
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+Project [spark_catalog.default.bar1_10(b#x) AS spark_catalog.default.bar1_10(3)#x]
++- Project [b#x, cast(try_cast(b#x as string) as int) AS a#x]
+ +- Project [cast(3 as int) AS b#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1c(SUM(c2) + rand(0) * 0) FROM t1 GROUP by c1
+CREATE OR REPLACE FUNCTION foo1_11a() RETURN 42
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11a, , 42, false, false, false, true
-- !query
-SELECT foo3_1b(foo3_1b(MAX(c2))) FROM t1
+SELECT foo1_11a()
-- !query analysis
-Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(spark_catalog.default.foo3_1b(max(c2)))#x]
-+- Project [max(c2)#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x]
- +- Project [max(c2)#x, cast(max(c2)#x as int) AS x#x]
- +- Aggregate [max(c2#x) AS max(c2)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11a() AS spark_catalog.default.foo1_11a()#x]
++- Project
+ +- OneRowRelation
-- !query
-SELECT foo3_1b(MAX(foo3_1b(c2))) FROM t1
+CREATE OR REPLACE FUNCTION foo1_11b() RETURN 'hello world'
-- !query analysis
-Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(max(spark_catalog.default.foo3_1b(c2)))#x]
-+- Project [max(spark_catalog.default.foo3_1b(c2))#x, cast(max(spark_catalog.default.foo3_1b(c2))#x as int) AS x#x]
- +- Aggregate [max(spark_catalog.default.foo3_1b(x#x)) AS max(spark_catalog.default.foo3_1b(c2))#x]
- +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11b, , 'hello world', false, false, false, true
-- !query
-SELECT foo3_1a(foo3_1b(c1), MAX(c2)) FROM t1 GROUP BY c1
+SELECT foo1_11b()
-- !query analysis
-Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(spark_catalog.default.foo3_1b(c1), max(c2))#x]
-+- Project [c1#x, max(c2)#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as double) AS a#x, cast(max(c2)#x as double) AS b#x]
- +- Project [c1#x, max(c2)#x, cast(c1#x as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, max(c2#x) AS max(c2)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11b() AS spark_catalog.default.foo1_11b()#x]
++- Project
+ +- OneRowRelation
-- !query
-SELECT c1, foo3_1b(c1) FROM t1 GROUP BY c1
+CREATE OR REPLACE FUNCTION foo1_11c(a INT, b INT) RETURN a + b
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(c1)#x]
-+- Project [c1#x, c1#x, cast(c1#x as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, c1#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11c, a INT, b INT, , a + b, false, false, false, true
-- !query
-SELECT c1, foo3_1b(c1 + 1) FROM t1 GROUP BY c1
+SELECT foo1_11c(3, 5)
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b((c1 + 1))#x]
-+- Project [c1#x, (c1 + 1)#x, cast((c1 + 1)#x as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, (c1#x + 1) AS (c1 + 1)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11c(a#x, b#x) AS spark_catalog.default.foo1_11c(3, 5)#x]
++- Project [cast(3 as int) AS a#x, cast(5 as int) AS b#x]
+ +- OneRowRelation
-- !query
-SELECT c1, foo3_1b(c1 + rand(0) * 0) FROM t1 GROUP BY c1
+CREATE OR REPLACE FUNCTION foo1_11d(a DOUBLE, b INT) RETURN a * b + 1.5
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11d, a DOUBLE, b INT, , a * b + 1.5, false, false, false, true
-- !query
-SELECT c1, foo3_1a(c1, MIN(c2)) FROM t1 GROUP BY c1
+SELECT foo1_11d(3.0, 5)
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, min(c2))#x]
-+- Project [c1#x, c1#x, min(c2)#x, cast(c1#x as double) AS a#x, cast(min(c2)#x as double) AS b#x]
- +- Aggregate [c1#x], [c1#x, c1#x, min(c2#x) AS min(c2)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11d(a#x, b#x) AS spark_catalog.default.foo1_11d(3.0, 5)#x]
++- Project [cast(3.0 as double) AS a#x, cast(5 as int) AS b#x]
+ +- OneRowRelation
-- !query
-SELECT c1, foo3_1a(c1 + 1, MIN(c2 + 1)) FROM t1 GROUP BY c1
+CREATE OR REPLACE FUNCTION foo1_11e(a INT) RETURN a > 10
-- !query analysis
-Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a((c1 + 1), min((c2 + 1)))#x]
-+- Project [c1#x, (c1 + 1)#x, min((c2 + 1))#x, cast((c1 + 1)#x as double) AS a#x, cast(min((c2 + 1))#x as double) AS b#x]
- +- Aggregate [c1#x], [c1#x, (c1#x + 1) AS (c1 + 1)#x, min((c2#x + 1)) AS min((c2 + 1))#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11e, a INT, , a > 10, false, false, false, true
-- !query
-SELECT c1, c2, foo3_1a(c1, c2) FROM t1 GROUP BY c1, c2
+SELECT foo1_11e(15), foo1_11e(5)
-- !query analysis
-Project [c1#x, c2#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, c2)#x]
-+- Project [c1#x, c2#x, c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
- +- Aggregate [c1#x, c2#x], [c1#x, c2#x, c1#x, c2#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11e(a#x) AS spark_catalog.default.foo1_11e(15)#x, spark_catalog.default.foo1_11e(a#x) AS spark_catalog.default.foo1_11e(5)#x]
++- Project [cast(15 as int) AS a#x, cast(5 as int) AS a#x]
+ +- OneRowRelation
-- !query
-SELECT c1, c2, foo3_1a(1, 2) FROM t1 GROUP BY c1, c2
+CREATE OR REPLACE FUNCTION foo1_11f(d DATE) RETURN d + INTERVAL '1' DAY
-- !query analysis
-Project [c1#x, c2#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(1, 2)#x]
-+- Project [c1#x, c2#x, 1#x, 2#x, cast(1#x as double) AS a#x, cast(2#x as double) AS b#x]
- +- Aggregate [c1#x, c2#x], [c1#x, c2#x, 1 AS 1#x, 2 AS 2#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11f, d DATE, , d + INTERVAL '1' DAY, false, false, false, true
-- !query
-SELECT c1 + c2, foo3_1b(c1 + c2 + 1) FROM t1 GROUP BY c1 + c2
+SELECT foo1_11f(DATE '2024-01-01')
-- !query analysis
-Project [(c1 + c2)#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(((c1 + c2) + 1))#x]
-+- Project [(c1 + c2)#x, ((c1 + c2) + 1)#x, cast(((c1 + c2) + 1)#x as int) AS x#x]
- +- Aggregate [(c1#x + c2#x)], [(c1#x + c2#x) AS (c1 + c2)#x, ((c1#x + c2#x) + 1) AS ((c1 + c2) + 1)#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+[Analyzer test output redacted due to nondeterminism]
-- !query
-SELECT COUNT(*) + foo3_1b(c1) + foo3_1b(SUM(c2)) + SUM(foo3_1b(c2)) FROM t1 GROUP BY c1
+CREATE OR REPLACE FUNCTION foo1_11g(n INT) RETURN ARRAY(1, 2, n)
-- !query analysis
-Project [(((count(1)#xL + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) + sum(spark_catalog.default.foo3_1b(c2))#xL) AS (((count(1) + spark_catalog.default.foo3_1b(c1)) + spark_catalog.default.foo3_1b(sum(c2))) + sum(spark_catalog.default.foo3_1b(c2)))#xL]
-+- Project [count(1)#xL, c1#x, sum(c2)#xL, sum(spark_catalog.default.foo3_1b(c2))#xL, cast(c1#x as int) AS x#x, cast(sum(c2)#xL as int) AS x#x]
- +- Aggregate [c1#x], [count(1) AS count(1)#xL, c1#x, sum(c2#x) AS sum(c2)#xL, sum(spark_catalog.default.foo3_1b(x#x)) AS sum(spark_catalog.default.foo3_1b(c2))#xL]
- +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11g, n INT, , ARRAY(1, 2, n), false, false, false, true
-- !query
-SELECT c1, COUNT(*), foo3_1b(SUM(c2)) FROM t1 GROUP BY c1 HAVING COUNT(*) > 0
+SELECT foo1_11g(5)
-- !query analysis
-Filter (count(1)#xL > cast(0 as bigint))
-+- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(sum(c2))#x]
- +- Project [c1#x, count(1)#xL, sum(c2)#xL, cast(sum(c2)#xL as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11g(n#x) AS spark_catalog.default.foo1_11g(5)#x]
++- Project [cast(5 as int) AS n#x]
+ +- OneRowRelation
-- !query
-SELECT c1, COUNT(*), foo3_1b(SUM(c2)) FROM t1 GROUP BY c1 HAVING foo3_1b(SUM(c2)) > 0
+CREATE OR REPLACE FUNCTION foo1_11h(a INT, b STRING) RETURN STRUCT(a, b)
-- !query analysis
-Filter (spark_catalog.default.foo3_1b(sum(c2))#x > 0)
-+- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(sum(c2))#x]
- +- Project [c1#x, count(1)#xL, sum(c2)#xL, cast(sum(c2)#xL as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11h, a INT, b STRING, , STRUCT(a, b), false, false, false, true
-- !query
-SELECT c1, COUNT(*), foo3_1b(SUM(c2)) FROM t1 GROUP BY c1 HAVING SUM(foo3_1b(c2)) > 0
+SELECT foo1_11h(1, 'test')
-- !query analysis
-Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(sum(c2))#x]
-+- Filter (sum(spark_catalog.default.foo3_1b(c2))#xL > cast(0 as bigint))
- +- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(sum(c2))#x, sum(spark_catalog.default.foo3_1b(c2))#xL]
- +- Project [c1#x, count(1)#xL, sum(c2)#xL, sum(spark_catalog.default.foo3_1b(c2))#xL, cast(sum(c2)#xL as int) AS x#x]
- +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL, sum(spark_catalog.default.foo3_1b(x#x)) AS sum(spark_catalog.default.foo3_1b(c2))#xL]
- +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11h(a#x, b#x) AS spark_catalog.default.foo1_11h(1, test)#x]
++- Project [cast(1 as int) AS a#x, cast(test as string) AS b#x]
+ +- OneRowRelation
-- !query
-SELECT foo3_1b(c1), MIN(c2) FROM t1 GROUP BY 1
+CREATE OR REPLACE FUNCTION foo1_11i(x INT) RETURN (SELECT x * 2)
-- !query analysis
-Project [spark_catalog.default.foo3_1b(c1)#x, min(c2)#x]
-+- Aggregate [spark_catalog.default.foo3_1b#x], [spark_catalog.default.foo3_1b#x AS spark_catalog.default.foo3_1b(c1)#x, min(c2#x) AS min(c2)#x]
- +- Project [c1#x, c2#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b#x]
- +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11i, x INT, , (SELECT x * 2), false, false, false, true
-- !query
-SELECT foo3_1a(c1 + rand(0) * 0, c2) FROM t1 GROUP BY 1
+SELECT foo1_11i(5)
-- !query analysis
-[Analyzer test output redacted due to nondeterminism]
+Project [spark_catalog.default.foo1_11i(x#x) AS spark_catalog.default.foo1_11i(5)#x]
++- Project [cast(5 as int) AS x#x]
+ +- OneRowRelation
-- !query
-SELECT c1, c2, foo3_1a(c1, c2) FROM t1 GROUP BY c1, c2, 3
+CREATE OR REPLACE FUNCTION foo1_11j(s STRING) RETURN UPPER(s)
-- !query analysis
-Project [c1#x, c2#x, spark_catalog.default.foo3_1a(c1, c2)#x]
-+- Aggregate [c1#x, c2#x, spark_catalog.default.foo3_1a#x], [c1#x, c2#x, spark_catalog.default.foo3_1a#x AS spark_catalog.default.foo3_1a(c1, c2)#x]
- +- Project [c1#x, c2#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a#x]
- +- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
- +- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+CreateSQLFunctionCommand spark_catalog.default.foo1_11j, s STRING, , UPPER(s), false, false, false, true
-- !query
-SELECT c1, (SELECT c1), (SELECT foo3_1b(c1)), SUM(c2) FROM t1 GROUP BY 1, 2, 3
+SELECT foo1_11j('hello')
-- !query analysis
-Aggregate [c1#x, scalar-subquery#x [c1#x], scalar-subquery#x [c1#x]], [c1#x, scalar-subquery#x [c1#x] AS scalarsubquery(c1)#x, scalar-subquery#x [c1#x] AS scalarsubquery(c1)#x, sum(c2#x) AS sum(c2)#xL]
-: :- Project [outer(c1#x)]
-: : +- OneRowRelation
-: :- Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(outer(spark_catalog.default.t1.c1))#x]
-: : +- Project [cast(outer(c1#x) as int) AS x#x]
-: : +- OneRowRelation
-: :- Project [outer(c1#x)]
-: : +- OneRowRelation
-: +- Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(outer(spark_catalog.default.t1.c1))#x]
-: +- Project [cast(outer(c1#x) as int) AS x#x]
-: +- OneRowRelation
-+- SubqueryAlias spark_catalog.default.t1
- +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
- +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
- +- LocalRelation [col1#x, col2#x]
+Project [spark_catalog.default.foo1_11j(s#x) AS spark_catalog.default.foo1_11j(hello)#x]
++- Project [cast(hello as string) AS s#x]
+ +- OneRowRelation
-- !query
-SELECT c1, SUM(c2) + foo3_1a(MIN(c2), MAX(c2)) + (SELECT SUM(c2)) FROM t1 GROUP BY c1
+CREATE OR REPLACE FUNCTION foo1_11k(a INT, b STRING) RETURN CONCAT(CAST(a AS STRING), '_', b)
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
-{
- "errorClass" : "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.CORRELATED_REFERENCE",
- "sqlState" : "0A000",
- "messageParameters" : {
- "sqlExprs" : "\"sum(c2) AS `sum(outer(spark_catalog.default.t1.c2))`\""
+CreateSQLFunctionCommand spark_catalog.default.foo1_11k, a INT, b STRING, , CONCAT(CAST(a AS STRING), '_', b), false, false, false, true
+
+
+-- !query
+SELECT foo1_11k(123, 'test')
+-- !query analysis
+Project [spark_catalog.default.foo1_11k(a#x, b#x) AS spark_catalog.default.foo1_11k(123, test)#x]
++- Project [cast(123 as int) AS a#x, cast(test as string) AS b#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE OR REPLACE FUNCTION foo1_11l() RETURNS TABLE RETURN SELECT 1 as id, 'hello' as name
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo1_11l, TABLE, SELECT 1 as id, 'hello' as name, true, false, false, true
+
+
+-- !query
+SELECT * FROM foo1_11l()
+-- !query analysis
+Project [id#x, name#x]
++- SQLFunctionNode spark_catalog.default.foo1_11l
+ +- SubqueryAlias foo1_11l
+ +- Project [cast(id#x as int) AS id#x, cast(name#x as string) AS name#x]
+ +- Project [1 AS id#x, hello AS name#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE OR REPLACE FUNCTION foo1_11m(a INT, b STRING) RETURNS TABLE RETURN SELECT a * 2 as doubled, UPPER(b) as upper_name
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo1_11m, a INT, b STRING, TABLE, SELECT a * 2 as doubled, UPPER(b) as upper_name, true, false, false, true
+
+
+-- !query
+SELECT * FROM foo1_11m(5, 'world')
+-- !query analysis
+Project [doubled#x, upper_name#x]
++- SQLFunctionNode spark_catalog.default.foo1_11m
+ +- SubqueryAlias foo1_11m
+ +- Project [cast(doubled#x as int) AS doubled#x, cast(upper_name#x as string) AS upper_name#x]
+ +- Project [(cast(5 as int) * 2) AS doubled#x, upper(cast(world as string)) AS upper_name#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE OR REPLACE FUNCTION foo1_11n(arr ARRAY<INT>) RETURNS TABLE RETURN SELECT size(arr) as array_size, arr[0] as first_element
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo1_11n, arr ARRAY<INT>, TABLE, SELECT size(arr) as array_size, arr[0] as first_element, true, false, false, true
+
+
+-- !query
+SELECT * FROM foo1_11n(ARRAY(1, 2, 3))
+-- !query analysis
+Project [array_size#x, first_element#x]
++- SQLFunctionNode spark_catalog.default.foo1_11n
+ +- SubqueryAlias foo1_11n
+ +- Project [cast(array_size#x as int) AS array_size#x, cast(first_element#x as int) AS first_element#x]
+         +- Project [size(cast(array(1, 2, 3) as array<int>), false) AS array_size#x, cast(array(1, 2, 3) as array<int>)[0] AS first_element#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE OR REPLACE FUNCTION foo1_11o(id INT, name STRING) RETURNS TABLE RETURN SELECT STRUCT(id, name) as person_info, id + 100 as modified_id
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo1_11o, id INT, name STRING, TABLE, SELECT STRUCT(id, name) as person_info, id + 100 as modified_id, true, false, false, true
+
+
+-- !query
+SELECT * FROM foo1_11o(1, 'Alice')
+-- !query analysis
+Project [person_info#x, modified_id#x]
++- SQLFunctionNode spark_catalog.default.foo1_11o
+ +- SubqueryAlias foo1_11o
+      +- Project [cast(person_info#x as struct<id:int,name:string>) AS person_info#x, cast(modified_id#x as int) AS modified_id#x]
+ +- Project [struct(id, cast(1 as int), name, cast(Alice as string)) AS person_info#x, (cast(1 as int) + 100) AS modified_id#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_1a(a INT) RETURNS INT RETURN a
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_1a, a INT, INT, a, false, false, false, false
+
+
+-- !query
+SELECT foo2_1a(5)
+-- !query analysis
+Project [spark_catalog.default.foo2_1a(a#x) AS spark_catalog.default.foo2_1a(5)#x]
++- Project [cast(5 as int) AS a#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_1b(a INT, b INT) RETURNS INT RETURN a + b
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_1b, a INT, b INT, INT, a + b, false, false, false, false
+
+
+-- !query
+SELECT foo2_1b(5, 6)
+-- !query analysis
+Project [spark_catalog.default.foo2_1b(a#x, b#x) AS spark_catalog.default.foo2_1b(5, 6)#x]
++- Project [cast(5 as int) AS a#x, cast(6 as int) AS b#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_1c(a INT, b INT) RETURNS INT RETURN 10 * (a + b) + 100 * (a -b)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_1c, a INT, b INT, INT, 10 * (a + b) + 100 * (a -b), false, false, false, false
+
+
+-- !query
+SELECT foo2_1c(5, 6)
+-- !query analysis
+Project [spark_catalog.default.foo2_1c(a#x, b#x) AS spark_catalog.default.foo2_1c(5, 6)#x]
++- Project [cast(5 as int) AS a#x, cast(6 as int) AS b#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_1d(a INT, b INT) RETURNS INT RETURN ABS(a) - LENGTH(CAST(b AS VARCHAR(10)))
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_1d, a INT, b INT, INT, ABS(a) - LENGTH(CAST(b AS VARCHAR(10))), false, false, false, false
+
+
+-- !query
+SELECT foo2_1d(-5, 6)
+-- !query analysis
+Project [spark_catalog.default.foo2_1d(a#x, b#x) AS spark_catalog.default.foo2_1d(-5, 6)#x]
++- Project [cast(-5 as int) AS a#x, cast(6 as int) AS b#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_2a(a INT) RETURNS INT RETURN SELECT a
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_2a, a INT, INT, SELECT a, false, false, false, false
+
+
+-- !query
+SELECT foo2_2a(5)
+-- !query analysis
+Project [spark_catalog.default.foo2_2a(a#x) AS spark_catalog.default.foo2_2a(5)#x]
++- Project [cast(5 as int) AS a#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_2b(a INT) RETURNS INT RETURN 1 + (SELECT a)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_2b, a INT, INT, 1 + (SELECT a), false, false, false, false
+
+
+-- !query
+SELECT foo2_2b(5)
+-- !query analysis
+Project [spark_catalog.default.foo2_2b(a#x) AS spark_catalog.default.foo2_2b(5)#x]
+: +- Project [outer(a#x)]
+: +- OneRowRelation
++- Project [cast(5 as int) AS a#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_2c(a INT) RETURNS INT RETURN 1 + (SELECT (SELECT a))
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNRESOLVED_COLUMN.WITHOUT_SUGGESTION",
+ "sqlState" : "42703",
+ "messageParameters" : {
+ "objectName" : "`a`"
},
"queryContext" : [ {
"objectType" : "",
"objectName" : "",
- "startIndex" : 51,
- "stopIndex" : 64,
- "fragment" : "SELECT SUM(c2)"
+ "startIndex" : 21,
+ "stopIndex" : 21,
+ "fragment" : "a"
} ]
}
-- !query
-SELECT foo3_1b(SUM(c1)) + (SELECT foo3_1b(SUM(c1))) FROM t1
+CREATE FUNCTION foo2_2d(a INT) RETURNS INT RETURN 1 + (SELECT (SELECT (SELECT (SELECT a))))
-- !query analysis
org.apache.spark.sql.catalyst.ExtendedAnalysisException
{
- "errorClass" : "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.CORRELATED_REFERENCE",
- "sqlState" : "0A000",
+ "errorClass" : "UNRESOLVED_COLUMN.WITHOUT_SUGGESTION",
+ "sqlState" : "42703",
"messageParameters" : {
- "sqlExprs" : "\"sum(c1) AS `sum(outer(spark_catalog.default.t1.c1))`\""
+ "objectName" : "`a`"
},
"queryContext" : [ {
"objectType" : "",
"objectName" : "",
- "startIndex" : 27,
- "stopIndex" : 51,
- "fragment" : "(SELECT foo3_1b(SUM(c1)))"
+ "startIndex" : 37,
+ "stopIndex" : 37,
+ "fragment" : "a"
} ]
}
-- !query
-SELECT SUM(foo3_1b(SUM(c1))) FROM t1
+CREATE FUNCTION foo2_2e(a INT) RETURNS INT RETURN
+SELECT a FROM (VALUES 1) AS V(c1) WHERE c1 = 2
+UNION ALL
+SELECT a + 1 FROM (VALUES 1) AS V(c1)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_2e, a INT, INT, SELECT a FROM (VALUES 1) AS V(c1) WHERE c1 = 2
+UNION ALL
+SELECT a + 1 FROM (VALUES 1) AS V(c1), false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo2_2f(a INT) RETURNS INT RETURN
+SELECT a FROM (VALUES 1) AS V(c1)
+EXCEPT
+SELECT a + 1 FROM (VALUES 1) AS V(a)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_2f, a INT, INT, SELECT a FROM (VALUES 1) AS V(c1)
+EXCEPT
+SELECT a + 1 FROM (VALUES 1) AS V(a), false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo2_2g(a INT) RETURNS INT RETURN
+SELECT a FROM (VALUES 1) AS V(c1)
+INTERSECT
+SELECT a FROM (VALUES 1) AS V(a)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_2g, a INT, INT, SELECT a FROM (VALUES 1) AS V(c1)
+INTERSECT
+SELECT a FROM (VALUES 1) AS V(a), false, false, false, false
+
+
+-- !query
+DROP TABLE IF EXISTS t1
+-- !query analysis
+DropTable true, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t1
+
+
+-- !query
+DROP TABLE IF EXISTS t2
+-- !query analysis
+DropTable true, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.t2
+
+
+-- !query
+DROP TABLE IF EXISTS ts
-- !query analysis
org.apache.spark.sql.AnalysisException
{
- "errorClass" : "NESTED_AGGREGATE_FUNCTION",
- "sqlState" : "42607",
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 12,
- "stopIndex" : 27,
- "fragment" : "foo3_1b(SUM(c1))"
- } ]
+ "errorClass" : "WRONG_COMMAND_FOR_OBJECT_TYPE",
+ "sqlState" : "42809",
+ "messageParameters" : {
+ "alternative" : "DROP VIEW",
+ "foundType" : "VIEW",
+ "objectName" : "spark_catalog.default.ts",
+ "operation" : "DROP TABLE",
+ "requiredType" : "EXTERNAL or MANAGED"
+ }
}
-- !query
-SELECT foo3_1b(SUM(c1)) + (SELECT SUM(SUM(c1))) FROM t1
+DROP TABLE IF EXISTS tm
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
+org.apache.spark.sql.AnalysisException
{
- "errorClass" : "NESTED_AGGREGATE_FUNCTION",
- "sqlState" : "42607",
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 39,
- "stopIndex" : 45,
- "fragment" : "SUM(c1)"
- } ]
+ "errorClass" : "WRONG_COMMAND_FOR_OBJECT_TYPE",
+ "sqlState" : "42809",
+ "messageParameters" : {
+ "alternative" : "DROP VIEW",
+ "foundType" : "VIEW",
+ "objectName" : "spark_catalog.default.tm",
+ "operation" : "DROP TABLE",
+ "requiredType" : "EXTERNAL or MANAGED"
+ }
}
-- !query
-SELECT foo3_1b(SUM(c1) + SUM(SUM(c1))) FROM t1
+DROP TABLE IF EXISTS ta
-- !query analysis
-org.apache.spark.sql.catalyst.ExtendedAnalysisException
+org.apache.spark.sql.AnalysisException
{
- "errorClass" : "NESTED_AGGREGATE_FUNCTION",
- "sqlState" : "42607",
- "queryContext" : [ {
- "objectType" : "",
- "objectName" : "",
- "startIndex" : 30,
- "stopIndex" : 36,
- "fragment" : "SUM(c1)"
- } ]
-}
+ "errorClass" : "WRONG_COMMAND_FOR_OBJECT_TYPE",
+ "sqlState" : "42809",
+ "messageParameters" : {
+ "alternative" : "DROP VIEW",
+ "foundType" : "VIEW",
+ "objectName" : "spark_catalog.default.ta",
+ "operation" : "DROP TABLE",
+ "requiredType" : "EXTERNAL or MANAGED"
+ }
+}
+
+
+-- !query
+DROP TABLE IF EXISTS V1
+-- !query analysis
+DropTable true, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.V1
+
+
+-- !query
+DROP TABLE IF EXISTS V2
+-- !query analysis
+DropTable true, false
++- ResolvedIdentifier V2SessionCatalog(spark_catalog), default.V2
+
+
+-- !query
+DROP VIEW IF EXISTS t1
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`t1`, true, true, false
+
+
+-- !query
+DROP VIEW IF EXISTS t2
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`t2`, true, true, false
+
+
+-- !query
+DROP VIEW IF EXISTS ts
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`ts`, true, true, false
+
+
+-- !query
+DROP VIEW IF EXISTS tm
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`tm`, true, true, false
+
+
+-- !query
+DROP VIEW IF EXISTS ta
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`ta`, true, true, false
+
+
+-- !query
+DROP VIEW IF EXISTS V1
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`V1`, true, true, false
+
+
+-- !query
+DROP VIEW IF EXISTS V2
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`V2`, true, true, false
+
+
+-- !query
+CREATE FUNCTION foo2_3(a INT, b INT) RETURNS INT RETURN a + b
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_3, a INT, b INT, INT, a + b, false, false, false, false
+
+
+-- !query
+CREATE VIEW V1(c1, c2) AS VALUES (1, 2), (3, 4), (5, 6)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`V1`, [(c1,None), (c2,None)], VALUES (1, 2), (3, 4), (5, 6), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+CREATE VIEW V2(c1, c2) AS VALUES (-1, -2), (-3, -4), (-5, -6)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`V2`, [(c1,None), (c2,None)], VALUES (-1, -2), (-3, -4), (-5, -6), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo2_3(c1, c2), foo2_3(c2, 1), foo2_3(c1, c2) - foo2_3(c2, c1 - 1) FROM V1 ORDER BY 1, 2, 3
+-- !query analysis
+Sort [spark_catalog.default.foo2_3(c1, c2)#x ASC NULLS FIRST, spark_catalog.default.foo2_3(c2, 1)#x ASC NULLS FIRST, (spark_catalog.default.foo2_3(c1, c2) - spark_catalog.default.foo2_3(c2, (c1 - 1)))#x ASC NULLS FIRST], true
++- Project [spark_catalog.default.foo2_3(a#x, b#x) AS spark_catalog.default.foo2_3(c1, c2)#x, spark_catalog.default.foo2_3(a#x, b#x) AS spark_catalog.default.foo2_3(c2, 1)#x, (spark_catalog.default.foo2_3(a#x, b#x) - spark_catalog.default.foo2_3(a#x, b#x)) AS (spark_catalog.default.foo2_3(c1, c2) - spark_catalog.default.foo2_3(c2, (c1 - 1)))#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x, cast(c2#x as int) AS a#x, cast(1 as int) AS b#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x, cast(c2#x as int) AS a#x, cast((c1#x - 1) as int) AS b#x]
+ +- SubqueryAlias spark_catalog.default.v1
+ +- View (`spark_catalog`.`default`.`v1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM V1 WHERE foo2_3(c1, 0) = c1 AND foo2_3(c1, c2) < 8
+-- !query analysis
+Project [c1#x, c2#x]
++- Project [c1#x, c2#x]
+ +- Filter ((spark_catalog.default.foo2_3(a#x, b#x) = c1#x) AND (spark_catalog.default.foo2_3(a#x, b#x) < 8))
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS a#x, cast(0 as int) AS b#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x]
+ +- SubqueryAlias spark_catalog.default.v1
+ +- View (`spark_catalog`.`default`.`v1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo2_3(SUM(c1), SUM(c2)), SUM(c1) + SUM(c2), SUM(foo2_3(c1, c2) + foo2_3(c2, c1) - foo2_3(c2, c1))
+FROM V1
+-- !query analysis
+Project [spark_catalog.default.foo2_3(a#x, b#x) AS spark_catalog.default.foo2_3(sum(c1), sum(c2))#x, (sum(c1) + sum(c2))#xL, sum(((spark_catalog.default.foo2_3(c1, c2) + spark_catalog.default.foo2_3(c2, c1)) - spark_catalog.default.foo2_3(c2, c1)))#xL]
++- Project [sum(c1)#xL, sum(c2)#xL, (sum(c1) + sum(c2))#xL, sum(((spark_catalog.default.foo2_3(c1, c2) + spark_catalog.default.foo2_3(c2, c1)) - spark_catalog.default.foo2_3(c2, c1)))#xL, cast(sum(c1)#xL as int) AS a#x, cast(sum(c2)#xL as int) AS b#x]
+ +- Aggregate [sum(c1#x) AS sum(c1)#xL, sum(c2#x) AS sum(c2)#xL, (sum(c1#x) + sum(c2#x)) AS (sum(c1) + sum(c2))#xL, sum(((spark_catalog.default.foo2_3(a#x, b#x) + spark_catalog.default.foo2_3(a#x, b#x)) - spark_catalog.default.foo2_3(a#x, b#x))) AS sum(((spark_catalog.default.foo2_3(c1, c2) + spark_catalog.default.foo2_3(c2, c1)) - spark_catalog.default.foo2_3(c2, c1)))#xL]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS a#x, cast(c2#x as int) AS b#x, cast(c2#x as int) AS a#x, cast(c1#x as int) AS b#x, cast(c2#x as int) AS a#x, cast(c1#x as int) AS b#x]
+ +- SubqueryAlias spark_catalog.default.v1
+ +- View (`spark_catalog`.`default`.`v1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+CREATE FUNCTION foo2_4a(a ARRAY<STRING>) RETURNS STRING RETURN
+SELECT array_sort(a, (i, j) -> rank[i] - rank[j])[0] FROM (SELECT MAP('a', 1, 'b', 2) rank)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_4a, a ARRAY<STRING>, STRING, SELECT array_sort(a, (i, j) -> rank[i] - rank[j])[0] FROM (SELECT MAP('a', 1, 'b', 2) rank), false, false, false, false
+
+
+-- !query
+SELECT foo2_4a(ARRAY('a', 'b'))
+-- !query analysis
+Project [spark_catalog.default.foo2_4a(a#x) AS spark_catalog.default.foo2_4a(array(a, b))#x]
+: +- Project [array_sort(outer(a#x), lambdafunction((rank#x[lambda i#x] - rank#x[lambda j#x]), lambda i#x, lambda j#x, false), false)[0] AS array_sort(outer(foo2_4a.a), lambdafunction((rank[namedlambdavariable()] - rank[namedlambdavariable()]), namedlambdavariable(), namedlambdavariable()))[0]#x]
+: +- SubqueryAlias __auto_generated_subquery_name
+: +- Project [map(a, 1, b, 2) AS rank#x]
+: +- OneRowRelation
++- Project [cast(array(a, b) as array<string>) AS a#x]
+ +- OneRowRelation
+
+
+-- !query
+CREATE FUNCTION foo2_4b(m MAP<STRING, STRING>, k STRING) RETURNS STRING RETURN
+SELECT v || ' ' || v FROM (SELECT upper(m[k]) AS v)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo2_4b, m MAP<STRING, STRING>, k STRING, STRING, SELECT v || ' ' || v FROM (SELECT upper(m[k]) AS v), false, false, false, false
+
+
+-- !query
+SELECT foo2_4b(map('a', 'hello', 'b', 'world'), 'a')
+-- !query analysis
+Project [spark_catalog.default.foo2_4b(m#x, k#x) AS spark_catalog.default.foo2_4b(map(a, hello, b, world), a)#x]
+: +- Project [concat(concat(v#x, ), v#x) AS concat(concat(v, ), v)#x]
+: +- SubqueryAlias __auto_generated_subquery_name
+: +- Project [upper(outer(m#x)[outer(k#x)]) AS v#x]
+: +- OneRowRelation
++- Project [cast(map(a, hello, b, world) as map<string,string>) AS m#x, cast(a as string) AS k#x]
+ +- OneRowRelation
+
+
+-- !query
+DROP VIEW V2
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`V2`, false, true, false
+
+
+-- !query
+DROP VIEW V1
+-- !query analysis
+DropTableCommand `spark_catalog`.`default`.`V1`, false, true, false
+
+
+-- !query
+CREATE VIEW t1(c1, c2) AS VALUES (0, 1), (0, 2), (1, 2)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`t1`, [(c1,None), (c2,None)], VALUES (0, 1), (0, 2), (1, 2), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+CREATE VIEW t2(c1, c2) AS VALUES (0, 2), (0, 3)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`t2`, [(c1,None), (c2,None)], VALUES (0, 2), (0, 3), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+CREATE VIEW ts(x) AS VALUES NAMED_STRUCT('a', 1, 'b', 2)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`ts`, [(x,None)], VALUES NAMED_STRUCT('a', 1, 'b', 2), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x]
+
+
+-- !query
+CREATE VIEW tm(x) AS VALUES MAP('a', 1, 'b', 2)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`tm`, [(x,None)], VALUES MAP('a', 1, 'b', 2), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x]
+
+
+-- !query
+CREATE VIEW ta(x) AS VALUES ARRAY(1, 2, 3)
+-- !query analysis
+CreateViewCommand `spark_catalog`.`default`.`ta`, [(x,None)], VALUES ARRAY(1, 2, 3), false, false, PersistedView, COMPENSATION, true
+ +- LocalRelation [col1#x]
+
+
+-- !query
+CREATE FUNCTION foo3_1a(a DOUBLE, b DOUBLE) RETURNS DOUBLE RETURN a * b
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1a, a DOUBLE, b DOUBLE, DOUBLE, a * b, false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1b(x INT) RETURNS INT RETURN x
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1b, x INT, INT, x, false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1c(x INT) RETURNS INT RETURN SELECT x
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1c, x INT, INT, SELECT x, false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1d(x INT) RETURNS INT RETURN (SELECT SUM(c2) FROM t2 WHERE c1 = x)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1d, x INT, INT, (SELECT SUM(c2) FROM t2 WHERE c1 = x), false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1e() RETURNS INT RETURN foo3_1d(0)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1e, INT, foo3_1d(0), false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1f() RETURNS INT RETURN SELECT SUM(c2) FROM t2 WHERE c1 = 0
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1f, INT, SELECT SUM(c2) FROM t2 WHERE c1 = 0, false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1g(x INT) RETURNS INT RETURN SELECT (SELECT x)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1g, x INT, INT, SELECT (SELECT x), false, false, false, false
+
+
+-- !query
+SELECT a, b, foo3_1a(a + 1, b + 1) FROM t1 AS t(a, b)
+-- !query analysis
+Project [a#x, b#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a((a + 1), (b + 1))#x]
++- Project [a#x, b#x, cast((a#x + 1) as double) AS a#x, cast((b#x + 1) as double) AS b#x]
+ +- SubqueryAlias t
+ +- Project [c1#x AS a#x, c2#x AS b#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT x, foo3_1c(x) FROM t1 AS t(x, y)
+-- !query analysis
+Project [x#x, spark_catalog.default.foo3_1c(x#x) AS spark_catalog.default.foo3_1c(x)#x]
++- Project [x#x, y#x, cast(x#x as int) AS x#x]
+ +- SubqueryAlias t
+ +- Project [c1#x AS x#x, c2#x AS y#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1d(c1) FROM t1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1d(x#x) AS spark_catalog.default.foo3_1d(c1)#x]
+: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+: +- Filter (c1#x = outer(x#x))
+: +- SubqueryAlias spark_catalog.default.t2
+: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+: +- LocalRelation [col1#x, col2#x]
++- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1a(foo3_1b(c1), foo3_1b(c1)) FROM t1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(spark_catalog.default.foo3_1b(c1), spark_catalog.default.foo3_1b(c1))#x]
++- Project [c1#x, c2#x, x#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as double) AS a#x, cast(spark_catalog.default.foo3_1b(x#x) as double) AS b#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1d(foo3_1c(foo3_1b(c1))) FROM t1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1d(x#x) AS spark_catalog.default.foo3_1d(spark_catalog.default.foo3_1c(spark_catalog.default.foo3_1b(c1)))#x]
+: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+: +- Filter (c1#x = outer(x#x))
+: +- SubqueryAlias spark_catalog.default.t2
+: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+: +- LocalRelation [col1#x, col2#x]
++- Project [c1#x, c2#x, x#x, x#x, cast(spark_catalog.default.foo3_1c(x#x) as int) AS x#x]
+ +- Project [c1#x, c2#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1a(foo3_1c(foo3_1b(c1)), foo3_1d(foo3_1b(c1))) FROM t1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(spark_catalog.default.foo3_1c(spark_catalog.default.foo3_1b(c1)), spark_catalog.default.foo3_1d(spark_catalog.default.foo3_1b(c1)))#x]
++- Project [c1#x, c2#x, x#x, x#x, x#x, x#x, cast(spark_catalog.default.foo3_1c(x#x) as double) AS a#x, cast(spark_catalog.default.foo3_1d(x#x) as double) AS b#x]
+ : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+ : +- Filter (c1#x = outer(x#x))
+ : +- SubqueryAlias spark_catalog.default.t2
+ : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- Project [c1#x, c2#x, x#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1c(foo3_1e()) FROM t1
+-- !query analysis
+Project [spark_catalog.default.foo3_1c(x#x) AS spark_catalog.default.foo3_1c(spark_catalog.default.foo3_1e())#x]
++- Project [c1#x, c2#x, x#x, cast(spark_catalog.default.foo3_1e() as int) AS x#x]
+ : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+ : +- Filter (c1#x = outer(x#x))
+ : +- SubqueryAlias spark_catalog.default.t2
+ : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- Project [c1#x, c2#x, cast(0 as int) AS x#x]
+ +- Project [c1#x, c2#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(MAX(c1), MAX(c2)) FROM t1
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(max(c1), max(c2))#x]
++- Project [max(c1)#x, max(c2)#x, cast(max(c1)#x as double) AS a#x, cast(max(c2)#x as double) AS b#x]
+ +- Aggregate [max(c1#x) AS max(c1)#x, max(c2#x) AS max(c2)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(MAX(c1), c2) FROM t1 GROUP BY c2
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(max(c1), c2)#x]
++- Project [max(c1)#x, c2#x, cast(max(c1)#x as double) AS a#x, cast(c2#x as double) AS b#x]
+ +- Aggregate [c2#x], [max(c1#x) AS max(c1)#x, c2#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(c1, c2) FROM t1 GROUP BY c1, c2
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, c2)#x]
++- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
+ +- Aggregate [c1#x, c2#x], [c1#x, c2#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT MAX(foo3_1a(c1, c2)) FROM t1 GROUP BY c1, c2
+-- !query analysis
+Project [max(spark_catalog.default.foo3_1a(c1, c2))#x]
++- Aggregate [c1#x, c2#x], [max(spark_catalog.default.foo3_1a(a#x, b#x)) AS max(spark_catalog.default.foo3_1a(c1, c2))#x]
+ +- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT MAX(c1) + foo3_1b(MAX(c1)) FROM t1 GROUP BY c2
+-- !query analysis
+Project [(max(c1)#x + spark_catalog.default.foo3_1b(x#x)) AS (max(c1) + spark_catalog.default.foo3_1b(max(c1)))#x]
++- Project [max(c1)#x, max(c1)#x, cast(max(c1)#x as int) AS x#x]
+ +- Aggregate [c2#x], [max(c1#x) AS max(c1)#x, max(c1#x) AS max(c1)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, SUM(foo3_1c(c2)) FROM t1 GROUP BY c1
+-- !query analysis
+Project [c1#x, sum(spark_catalog.default.foo3_1c(c2))#xL]
++- Aggregate [c1#x], [c1#x, sum(spark_catalog.default.foo3_1c(x#x)) AS sum(spark_catalog.default.foo3_1c(c2))#xL]
+ +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, SUM(foo3_1d(c2)) FROM t1 GROUP BY c1
+-- !query analysis
+Project [c1#x, sum(spark_catalog.default.foo3_1d(c2))#xL]
++- Aggregate [c1#x], [c1#x, sum(spark_catalog.default.foo3_1d(x#x)) AS sum(spark_catalog.default.foo3_1d(c2))#xL]
+ : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+ : +- Filter (c1#x = outer(x#x))
+ : +- SubqueryAlias spark_catalog.default.t2
+ : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1c(c1), foo3_1d(c1) FROM t1 GROUP BY c1
+-- !query analysis
+Project [spark_catalog.default.foo3_1c(x#x) AS spark_catalog.default.foo3_1c(c1)#x, spark_catalog.default.foo3_1d(x#x) AS spark_catalog.default.foo3_1d(c1)#x]
+: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+: +- Filter (c1#x = outer(x#x))
+: +- SubqueryAlias spark_catalog.default.t2
+: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+: +- LocalRelation [col1#x, col2#x]
++- Project [c1#x, c1#x, cast(c1#x as int) AS x#x, cast(c1#x as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, c1#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(SUM(c1), rand(0) * 0) FROM t1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT foo3_1a(SUM(c1) + rand(0) * 0, SUM(c2)) FROM t1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT foo3_1b(SUM(c1) + rand(0) * 0) FROM t1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT foo3_1b(SUM(1) + rand(0) * 0) FROM t1 GROUP BY c2
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT foo3_1c(SUM(c2) + rand(0) * 0) FROM t1 GROUP by c1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT foo3_1b(foo3_1b(MAX(c2))) FROM t1
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(spark_catalog.default.foo3_1b(max(c2)))#x]
++- Project [max(c2)#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as int) AS x#x]
+ +- Project [max(c2)#x, cast(max(c2)#x as int) AS x#x]
+ +- Aggregate [max(c2#x) AS max(c2)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b(MAX(foo3_1b(c2))) FROM t1
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(max(spark_catalog.default.foo3_1b(c2)))#x]
++- Project [max(spark_catalog.default.foo3_1b(c2))#x, cast(max(spark_catalog.default.foo3_1b(c2))#x as int) AS x#x]
+ +- Aggregate [max(spark_catalog.default.foo3_1b(x#x)) AS max(spark_catalog.default.foo3_1b(c2))#x]
+ +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(foo3_1b(c1), MAX(c2)) FROM t1 GROUP BY c1
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(spark_catalog.default.foo3_1b(c1), max(c2))#x]
++- Project [c1#x, max(c2)#x, x#x, cast(spark_catalog.default.foo3_1b(x#x) as double) AS a#x, cast(max(c2)#x as double) AS b#x]
+ +- Project [c1#x, max(c2)#x, cast(c1#x as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, max(c2#x) AS max(c2)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1b(c1) FROM t1 GROUP BY c1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(c1)#x]
++- Project [c1#x, c1#x, cast(c1#x as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, c1#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1b(c1 + 1) FROM t1 GROUP BY c1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b((c1 + 1))#x]
++- Project [c1#x, (c1 + 1)#x, cast((c1 + 1)#x as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, (c1#x + 1) AS (c1 + 1)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1b(c1 + rand(0) * 0) FROM t1 GROUP BY c1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT c1, foo3_1a(c1, MIN(c2)) FROM t1 GROUP BY c1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, min(c2))#x]
++- Project [c1#x, c1#x, min(c2)#x, cast(c1#x as double) AS a#x, cast(min(c2)#x as double) AS b#x]
+ +- Aggregate [c1#x], [c1#x, c1#x, min(c2#x) AS min(c2)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, foo3_1a(c1 + 1, MIN(c2 + 1)) FROM t1 GROUP BY c1
+-- !query analysis
+Project [c1#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a((c1 + 1), min((c2 + 1)))#x]
++- Project [c1#x, (c1 + 1)#x, min((c2 + 1))#x, cast((c1 + 1)#x as double) AS a#x, cast(min((c2 + 1))#x as double) AS b#x]
+ +- Aggregate [c1#x], [c1#x, (c1#x + 1) AS (c1 + 1)#x, min((c2#x + 1)) AS min((c2 + 1))#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, c2, foo3_1a(c1, c2) FROM t1 GROUP BY c1, c2
+-- !query analysis
+Project [c1#x, c2#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, c2)#x]
++- Project [c1#x, c2#x, c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
+ +- Aggregate [c1#x, c2#x], [c1#x, c2#x, c1#x, c2#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, c2, foo3_1a(1, 2) FROM t1 GROUP BY c1, c2
+-- !query analysis
+Project [c1#x, c2#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(1, 2)#x]
++- Project [c1#x, c2#x, 1#x, 2#x, cast(1#x as double) AS a#x, cast(2#x as double) AS b#x]
+ +- Aggregate [c1#x, c2#x], [c1#x, c2#x, 1 AS 1#x, 2 AS 2#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1 + c2, foo3_1b(c1 + c2 + 1) FROM t1 GROUP BY c1 + c2
+-- !query analysis
+Project [(c1 + c2)#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(((c1 + c2) + 1))#x]
++- Project [(c1 + c2)#x, ((c1 + c2) + 1)#x, cast(((c1 + c2) + 1)#x as int) AS x#x]
+ +- Aggregate [(c1#x + c2#x)], [(c1#x + c2#x) AS (c1 + c2)#x, ((c1#x + c2#x) + 1) AS ((c1 + c2) + 1)#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT COUNT(*) + foo3_1b(c1) + foo3_1b(SUM(c2)) + SUM(foo3_1b(c2)) FROM t1 GROUP BY c1
+-- !query analysis
+Project [(((count(1)#xL + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) + sum(spark_catalog.default.foo3_1b(c2))#xL) AS (((count(1) + spark_catalog.default.foo3_1b(c1)) + spark_catalog.default.foo3_1b(sum(c2))) + sum(spark_catalog.default.foo3_1b(c2)))#xL]
++- Project [count(1)#xL, c1#x, sum(c2)#xL, sum(spark_catalog.default.foo3_1b(c2))#xL, cast(c1#x as int) AS x#x, cast(sum(c2)#xL as int) AS x#x]
+ +- Aggregate [c1#x], [count(1) AS count(1)#xL, c1#x, sum(c2#x) AS sum(c2)#xL, sum(spark_catalog.default.foo3_1b(x#x)) AS sum(spark_catalog.default.foo3_1b(c2))#xL]
+ +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, COUNT(*), foo3_1b(SUM(c2)) FROM t1 GROUP BY c1 HAVING COUNT(*) > 0
+-- !query analysis
+Filter (count(1)#xL > cast(0 as bigint))
++- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(sum(c2))#x]
+ +- Project [c1#x, count(1)#xL, sum(c2)#xL, cast(sum(c2)#xL as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, COUNT(*), foo3_1b(SUM(c2)) FROM t1 GROUP BY c1 HAVING foo3_1b(SUM(c2)) > 0
+-- !query analysis
+Filter (spark_catalog.default.foo3_1b(sum(c2))#x > 0)
++- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(sum(c2))#x]
+ +- Project [c1#x, count(1)#xL, sum(c2)#xL, cast(sum(c2)#xL as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, COUNT(*), foo3_1b(SUM(c2)) FROM t1 GROUP BY c1 HAVING SUM(foo3_1b(c2)) > 0
+-- !query analysis
+Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(sum(c2))#x]
++- Filter (sum(spark_catalog.default.foo3_1b(c2))#xL > cast(0 as bigint))
+ +- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(sum(c2))#x, sum(spark_catalog.default.foo3_1b(c2))#xL]
+ +- Project [c1#x, count(1)#xL, sum(c2)#xL, sum(spark_catalog.default.foo3_1b(c2))#xL, cast(sum(c2)#xL as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL, sum(spark_catalog.default.foo3_1b(x#x)) AS sum(spark_catalog.default.foo3_1b(c2))#xL]
+ +- Project [c1#x, c2#x, cast(c2#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b(c1), MIN(c2) FROM t1 GROUP BY 1
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(c1)#x, min(c2)#x]
++- Aggregate [spark_catalog.default.foo3_1b#x], [spark_catalog.default.foo3_1b#x AS spark_catalog.default.foo3_1b(c1)#x, min(c2#x) AS min(c2)#x]
+ +- Project [c1#x, c2#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(c1 + rand(0) * 0, c2) FROM t1 GROUP BY 1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT c1, c2, foo3_1a(c1, c2) FROM t1 GROUP BY c1, c2, 3
+-- !query analysis
+Project [c1#x, c2#x, spark_catalog.default.foo3_1a(c1, c2)#x]
++- Aggregate [c1#x, c2#x, spark_catalog.default.foo3_1a#x], [c1#x, c2#x, spark_catalog.default.foo3_1a#x AS spark_catalog.default.foo3_1a(c1, c2)#x]
+ +- Project [c1#x, c2#x, spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a#x]
+ +- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, (SELECT c1), (SELECT foo3_1b(c1)), SUM(c2) FROM t1 GROUP BY 1, 2, 3
+-- !query analysis
+Aggregate [c1#x, scalar-subquery#x [c1#x], scalar-subquery#x [c1#x]], [c1#x, scalar-subquery#x [c1#x] AS scalarsubquery(c1)#x, scalar-subquery#x [c1#x] AS scalarsubquery(c1)#x, sum(c2#x) AS sum(c2)#xL]
+: :- Project [outer(c1#x)]
+: : +- OneRowRelation
+: :- Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(outer(spark_catalog.default.t1.c1))#x]
+: : +- Project [cast(outer(c1#x) as int) AS x#x]
+: : +- OneRowRelation
+: :- Project [outer(c1#x)]
+: : +- OneRowRelation
+: +- Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(outer(spark_catalog.default.t1.c1))#x]
+: +- Project [cast(outer(c1#x) as int) AS x#x]
+: +- OneRowRelation
++- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, SUM(c2) + foo3_1a(MIN(c2), MAX(c2)) + (SELECT SUM(c2)) FROM t1 GROUP BY c1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.CORRELATED_REFERENCE",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "sqlExprs" : "\"sum(c2) AS `sum(outer(spark_catalog.default.t1.c2))`\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 51,
+ "stopIndex" : 64,
+ "fragment" : "SELECT SUM(c2)"
+ } ]
+}
+
+
+-- !query
+SELECT foo3_1b(SUM(c1)) + (SELECT foo3_1b(SUM(c1))) FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.CORRELATED_REFERENCE",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "sqlExprs" : "\"sum(c1) AS `sum(outer(spark_catalog.default.t1.c1))`\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 27,
+ "stopIndex" : 51,
+ "fragment" : "(SELECT foo3_1b(SUM(c1)))"
+ } ]
+}
+
+
+-- !query
+SELECT SUM(foo3_1b(SUM(c1))) FROM t1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "NESTED_AGGREGATE_FUNCTION",
+ "sqlState" : "42607",
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 12,
+ "stopIndex" : 27,
+ "fragment" : "foo3_1b(SUM(c1))"
+ } ]
+}
+
+
+-- !query
+SELECT foo3_1b(SUM(c1)) + (SELECT SUM(SUM(c1))) FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "NESTED_AGGREGATE_FUNCTION",
+ "sqlState" : "42607",
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 39,
+ "stopIndex" : 45,
+ "fragment" : "SUM(c1)"
+ } ]
+}
+
+
+-- !query
+SELECT foo3_1b(SUM(c1) + SUM(SUM(c1))) FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "NESTED_AGGREGATE_FUNCTION",
+ "sqlState" : "42607",
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 30,
+ "stopIndex" : 36,
+ "fragment" : "SUM(c1)"
+ } ]
+}
+
+
+-- !query
+SELECT foo3_1b(SUM(c1 + rand(0) * 0)) FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "AGGREGATE_FUNCTION_WITH_NONDETERMINISTIC_EXPRESSION",
+ "sqlState" : "42845",
+ "messageParameters" : {
+ "sqlExpr" : "\"sum((c1 + (rand(0) * 0)))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 20,
+ "stopIndex" : 35,
+ "fragment" : "c1 + rand(0) * 0"
+ } ]
+}
+
+
+-- !query
+SELECT SUM(foo3_1b(c1) + rand(0) * 0) FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "AGGREGATE_FUNCTION_WITH_NONDETERMINISTIC_EXPRESSION",
+ "sqlState" : "42845",
+ "messageParameters" : {
+ "sqlExpr" : "\"sum((spark_catalog.default.foo3_1b(foo3_1b.x) + (rand(0) * 0)))\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 12,
+ "stopIndex" : 36,
+ "fragment" : "foo3_1b(c1) + rand(0) * 0"
+ } ]
+}
+
+
+-- !query
+SELECT SUM(foo3_1b(c1 + rand(0) * 0)) FROM t1
+-- !query analysis
+[Analyzer test output redacted due to nondeterminism]
+
+
+-- !query
+SELECT foo3_1b(SUM(c1) + foo3_1b(SUM(c1))) FROM t1
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b((sum(c1) + spark_catalog.default.foo3_1b(sum(c1))))#x]
++- Project [sum(c1)#xL, sum(c1)#xL, x#x, cast((sum(c1)#xL + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) as int) AS x#x]
+ +- Project [sum(c1)#xL, sum(c1)#xL, cast(sum(c1)#xL as int) AS x#x]
+ +- Aggregate [sum(c1#x) AS sum(c1)#xL, sum(c1#x) AS sum(c1)#xL]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b(SUM(c2) + foo3_1b(SUM(c1))) AS foo FROM t1 HAVING foo > 0
+-- !query analysis
+Filter (foo#x > 0)
++- Project [spark_catalog.default.foo3_1b(x#x) AS foo#x]
+ +- Project [sum(c2)#xL, sum(c1)#xL, x#x, cast((sum(c2)#xL + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) as int) AS x#x]
+ +- Project [sum(c2)#xL, sum(c1)#xL, cast(sum(c1)#xL as int) AS x#x]
+ +- Aggregate [sum(c2#x) AS sum(c2)#xL, sum(c1#x) AS sum(c1)#xL]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, COUNT(*), foo3_1b(SUM(c2) + foo3_1b(SUM(c2))) FROM t1 GROUP BY c1 HAVING COUNT(*) > 0
+-- !query analysis
+Filter (count(1)#xL > cast(0 as bigint))
++- Project [c1#x, count(1)#xL, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b((sum(c2) + spark_catalog.default.foo3_1b(sum(c2))))#x]
+ +- Project [c1#x, count(1)#xL, sum(c2)#xL, sum(c2)#xL, x#x, cast((sum(c2)#xL + cast(spark_catalog.default.foo3_1b(x#x) as bigint)) as int) AS x#x]
+ +- Project [c1#x, count(1)#xL, sum(c2)#xL, sum(c2)#xL, cast(sum(c2)#xL as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, count(1) AS count(1)#xL, sum(c2#x) AS sum(c2)#xL, sum(c2#x) AS sum(c2)#xL]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1a(c1, MAX(c2)) FROM t1 GROUP BY c1, 1
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "GROUP_BY_POS_AGGREGATE",
+ "sqlState" : "42903",
+ "messageParameters" : {
+ "aggExpr" : "spark_catalog.default.foo3_1a(spark_catalog.default.t1.c1, max(spark_catalog.default.t1.c2)) AS `spark_catalog.default.foo3_1a(c1, max(c2))`",
+ "index" : "1"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 50,
+ "stopIndex" : 50,
+ "fragment" : "1"
+ } ]
+}
+
+
+-- !query
+WITH cte AS (SELECT foo3_1a(c1, c2) FROM t1)
+SELECT * FROM cte
+-- !query analysis
+WithCTE
+:- CTERelationDef xxxx, false
+: +- SubqueryAlias cte
+: +- Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, c2)#x]
+: +- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(c2#x as double) AS b#x]
+: +- SubqueryAlias spark_catalog.default.t1
+: +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+: +- LocalRelation [col1#x, col2#x]
++- Project [spark_catalog.default.foo3_1a(c1, c2)#x]
+ +- SubqueryAlias cte
+ +- CTERelationRef xxxx, true, [spark_catalog.default.foo3_1a(c1, c2)#x], false, false
+
+
+-- !query
+SELECT SUM(c2) FROM t1 GROUP BY foo3_1b(c1)
+-- !query analysis
+Project [sum(c2)#xL]
++- Aggregate [spark_catalog.default.foo3_1b#x], [sum(c2#x) AS sum(c2)#xL]
+ +- Project [c1#x, c2#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b(c1), SUM(c2) FROM t1 GROUP BY 1
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(c1)#x, sum(c2)#xL]
++- Aggregate [spark_catalog.default.foo3_1b#x], [spark_catalog.default.foo3_1b#x AS spark_catalog.default.foo3_1b(c1)#x, sum(c2#x) AS sum(c2)#xL]
+ +- Project [c1#x, c2#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b(c1), c2, GROUPING(foo3_1b(c1)), SUM(c1) FROM t1 GROUP BY ROLLUP(foo3_1b(c1), c2)
+-- !query analysis
+Aggregate [spark_catalog.default.foo3_1b(c1)#x, c2#x, spark_grouping_id#xL], [spark_catalog.default.foo3_1b(c1)#x AS spark_catalog.default.foo3_1b(c1)#x, c2#x, cast((shiftright(spark_grouping_id#xL, 1) & 1) as tinyint) AS grouping(spark_catalog.default.foo3_1b(c1))#x, sum(c1#x) AS sum(c1)#xL]
++- Expand [[c1#x, c2#x, spark_catalog.default.foo3_1b(c1)#x, c2#x, 0], [c1#x, c2#x, spark_catalog.default.foo3_1b(c1)#x, null, 1], [c1#x, c2#x, null, null, 3]], [c1#x, c2#x, spark_catalog.default.foo3_1b(c1)#x, c2#x, spark_grouping_id#xL]
+ +- Project [c1#x, c2#x, spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(c1)#x, c2#x AS c2#x]
+ +- Project [c1#x, c2#x, cast(c1#x as int) AS x#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, SUM(c2) FROM t1 GROUP BY c1 HAVING foo3_1b(SUM(c2)) > 1
+-- !query analysis
+Project [c1#x, sum(c2)#xL]
++- Filter (spark_catalog.default.foo3_1b(x#x) > 1)
+ +- Project [c1#x, sum(c2)#xL, cast(sum(c2)#xL as int) AS x#x]
+ +- Aggregate [c1#x], [c1#x, sum(c2#x) AS sum(c2)#xL]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c1, SUM(c2) FROM t1 GROUP BY CUBE(c1) HAVING foo3_1b(GROUPING(c1)) = 0
+-- !query analysis
+Project [c1#x, sum(c2)#xL]
++- Project [c1#x, sum(c2)#xL, spark_grouping_id#xL]
+ +- Filter (spark_catalog.default.foo3_1b(x#x) = 0)
+ +- Project [c1#x, sum(c2)#xL, spark_grouping_id#xL, cast(cast((shiftright(spark_grouping_id#xL, 0) & 1) as tinyint) as int) AS x#x]
+ +- Aggregate [c1#x, spark_grouping_id#xL], [c1#x, sum(c2#x) AS sum(c2)#xL, spark_grouping_id#xL]
+ +- Expand [[c1#x, c2#x, c1#x, 0], [c1#x, c2#x, null, 1]], [c1#x, c2#x, c1#x, spark_grouping_id#xL]
+ +- Project [c1#x, c2#x, c1#x AS c1#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1a(t1.c1, t2.c2) >= 2
+-- !query analysis
+Project [c1#x, c2#x, c1#x, c2#x]
++- Join Inner, (spark_catalog.default.foo3_1a(a#x, b#x) >= cast(2 as double))
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1b(t1.c2) = foo3_1b(t2.c2)
+-- !query analysis
+Project [c1#x, c2#x, c1#x, c2#x]
++- Join Inner, (spark_catalog.default.foo3_1b(x#x) = spark_catalog.default.foo3_1b(x#x))
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1b(t1.c1 + t2.c1 + 2) > 2
+-- !query analysis
+Project [c1#x, c2#x, c1#x, c2#x]
++- Join Inner, (spark_catalog.default.foo3_1b(x#x) > 2)
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1a(foo3_1b(t1.c1), t2.c2) >= 2
+-- !query analysis
+Project [c1#x, c2#x, c1#x, c2#x]
++- Join Inner, (spark_catalog.default.foo3_1a(a#x, b#x) >= cast(2 as double))
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1f() > 0
+-- !query analysis
+Project [c1#x, c2#x, c1#x, c2#x]
++- Join Inner, (spark_catalog.default.foo3_1f() > 0)
+ : +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+ : +- Filter (c1#x = 0)
+ : +- SubqueryAlias spark_catalog.default.t2
+ : +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1b(t1.c1 + rand(0) * 0) > 1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "INVALID_NON_DETERMINISTIC_EXPRESSIONS",
+ "sqlState" : "42K0E",
+ "messageParameters" : {
+ "sqlExprs" : "\"(spark_catalog.default.foo3_1b(foo3_1b.x) > 1)\""
+ }
+}
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1c(t1.c1) = 2
+-- !query analysis
+Project [c1#x, c2#x, c1#x, c2#x]
++- Join Inner, (spark_catalog.default.foo3_1c(x#x) = 2)
+ :- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT * FROM t1 JOIN t2 ON foo3_1g(t1.c1) = 2
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.UNSUPPORTED_CORRELATED_SCALAR_SUBQUERY",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "treeNode" : "Join Inner, (spark_catalog.default.foo3_1g(x#x) = 2)\n: +- Project [outer(x#x)]\n: +- OneRowRelation\n:- SubqueryAlias spark_catalog.default.t1\n: +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])\n: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]\n: +- LocalRelation [col1#x, col2#x]\n+- SubqueryAlias spark_catalog.default.t2\n +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])\n +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]\n +- LocalRelation [col1#x, col2#x]\n"
+ }
+}
+
+
+-- !query
+SELECT * FROM t1 ORDER BY foo3_1b(c1)
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SQL_UDF_USAGE",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "functionName" : "`spark_catalog`.`default`.`foo3_1b`",
+ "nodeName" : "Sort"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 27,
+ "stopIndex" : 37,
+ "fragment" : "foo3_1b(c1)"
+ } ]
+}
+
+
+-- !query
+SELECT * FROM t1 LIMIT foo3_1b(1)
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SQL_UDF_USAGE",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "functionName" : "`spark_catalog`.`default`.`foo3_1b`",
+ "nodeName" : "GlobalLimit"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 24,
+ "stopIndex" : 33,
+ "fragment" : "foo3_1b(1)"
+ } ]
+}
+
+
+-- !query
+SELECT * FROM ta LATERAL VIEW EXPLODE(ARRAY(foo3_1b(x[0]), foo3_1b(x[1]))) AS t
+-- !query analysis
+org.apache.spark.sql.AnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SQL_UDF_USAGE",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "functionName" : "`spark_catalog`.`default`.`foo3_1b`",
+ "nodeName" : "Generate"
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 45,
+ "stopIndex" : 57,
+ "fragment" : "foo3_1b(x[0])"
+ } ]
+}
+
+
+-- !query
+SELECT CASE WHEN foo3_1b(rand(0) * 0 < 1 THEN 1 ELSE -1 END
+-- !query analysis
+org.apache.spark.sql.catalyst.parser.ParseException
+{
+ "errorClass" : "PARSE_SYNTAX_ERROR",
+ "sqlState" : "42601",
+ "messageParameters" : {
+ "error" : "'foo3_1b'",
+ "hint" : ""
+ }
+}
+
+
+-- !query
+SELECT (SELECT SUM(c2) FROM t2 WHERE c1 = foo3_1b(t1.c1)) FROM t1
+-- !query analysis
+Project [scalar-subquery#x [c1#x] AS scalarsubquery(c1)#xL]
+: +- Aggregate [sum(c2#x) AS sum(c2)#xL]
+: +- Project [c1#x, c2#x]
+: +- Filter (c1#x = spark_catalog.default.foo3_1b(x#x))
+: +- Project [c1#x, c2#x, cast(outer(c1#x) as int) AS x#x]
+: +- SubqueryAlias spark_catalog.default.t2
+: +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+: +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+: +- LocalRelation [col1#x, col2#x]
++- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b((SELECT SUM(c1) FROM t1))
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(scalarsubquery())#x]
++- Project [cast(scalar-subquery#x [] as int) AS x#x]
+ : +- Aggregate [sum(c1#x) AS sum(c1)#xL]
+ : +- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- OneRowRelation
+
+
+-- !query
+SELECT foo3_1a(c1, (SELECT MIN(c1) FROM t1)) FROM t1
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(c1, scalarsubquery())#x]
++- Project [c1#x, c2#x, cast(c1#x as double) AS a#x, cast(scalar-subquery#x [] as double) AS b#x]
+ : +- Aggregate [min(c1#x) AS min(c1)#x]
+ : +- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t1
+ +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT foo3_1b((SELECT SUM(c1))) FROM t1
+-- !query analysis
+org.apache.spark.sql.catalyst.ExtendedAnalysisException
+{
+ "errorClass" : "UNSUPPORTED_SUBQUERY_EXPRESSION_CATEGORY.CORRELATED_REFERENCE",
+ "sqlState" : "0A000",
+ "messageParameters" : {
+ "sqlExprs" : "\"sum(c1) AS `sum(outer(spark_catalog.default.t1.c1))`\""
+ },
+ "queryContext" : [ {
+ "objectType" : "",
+ "objectName" : "",
+ "startIndex" : 17,
+ "stopIndex" : 30,
+ "fragment" : "SELECT SUM(c1)"
+ } ]
+}
+
+
+-- !query
+SELECT foo3_1b((SELECT SUM(c1) FROM t1 WHERE c2 = t2.c2)) FROM t2
+-- !query analysis
+Project [spark_catalog.default.foo3_1b(x#x) AS spark_catalog.default.foo3_1b(scalarsubquery(c2))#x]
++- Project [c1#x, c2#x, cast(scalar-subquery#x [c2#x] as int) AS x#x]
+ : +- Aggregate [sum(c1#x) AS sum(c1)#xL]
+ : +- Filter (c2#x = outer(c2#x))
+ : +- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+SELECT c2, AVG(foo3_1b((SELECT COUNT(*) FROM t1 WHERE c2 = t2.c2))) OVER (PARTITION BY c1) AS r FROM t2
+-- !query analysis
+Project [c2#x, r#x]
++- Project [c2#x, _w0#x, c1#x, r#x, r#x]
+ +- Window [avg(_w0#x) windowspecdefinition(c1#x, specifiedwindowframe(RowFrame, unboundedpreceding$(), unboundedfollowing$())) AS r#x], [c1#x]
+ +- Project [c2#x, spark_catalog.default.foo3_1b(x#x) AS _w0#x, c1#x]
+ +- Project [c1#x, c2#x, cast(scalar-subquery#x [c2#x] as int) AS x#x]
+ : +- Aggregate [count(1) AS count(1)#xL]
+ : +- Filter (c2#x = outer(c2#x))
+ : +- SubqueryAlias spark_catalog.default.t1
+ : +- View (`spark_catalog`.`default`.`t1`, [c1#x, c2#x])
+ : +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ : +- LocalRelation [col1#x, col2#x]
+ +- SubqueryAlias spark_catalog.default.t2
+ +- View (`spark_catalog`.`default`.`t2`, [c1#x, c2#x])
+ +- Project [cast(col1#x as int) AS c1#x, cast(col2#x as int) AS c2#x]
+ +- LocalRelation [col1#x, col2#x]
+
+
+-- !query
+CREATE FUNCTION foo3_1x(x STRUCT) RETURNS INT RETURN x.a + x.b
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1x, x STRUCT, INT, x.a + x.b, false, false, false, false
+
+
+-- !query
+CREATE FUNCTION foo3_1y(x ARRAY) RETURNS INT RETURN aggregate(x, BIGINT(0), (x, y) -> x + y)
+-- !query analysis
+CreateSQLFunctionCommand spark_catalog.default.foo3_1y, x ARRAY, INT, aggregate(x, BIGINT(0), (x, y) -> x + y), false, false, false, false
+
+
+-- !query
+SELECT foo3_1a(x.a, x.b) FROM ts
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(x.a, x.b)#x]
++- Project [x#x, cast(x#x.a as double) AS a#x, cast(x#x.b as double) AS b#x]
+ +- SubqueryAlias spark_catalog.default.ts
+ +- View (`spark_catalog`.`default`.`ts`, [x#x])
+ +- Project [cast(col1#x as struct) AS x#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT foo3_1x(x) FROM ts
+-- !query analysis
+Project [spark_catalog.default.foo3_1x(x#x) AS spark_catalog.default.foo3_1x(x)#x]
++- Project [x#x, cast(x#x as struct) AS x#x]
+ +- SubqueryAlias spark_catalog.default.ts
+ +- View (`spark_catalog`.`default`.`ts`, [x#x])
+ +- Project [cast(col1#x as struct) AS x#x]
+ +- LocalRelation [col1#x]
+
+
+-- !query
+SELECT foo3_1a(x['a'], x['b']) FROM tm
+-- !query analysis
+Project [spark_catalog.default.foo3_1a(a#x, b#x) AS spark_catalog.default.foo3_1a(x[a], x[b])#x]
++- Project [x#x, cast(x#x[a] as double) AS a#x, cast(x#x[b] as double) AS b#x]
+ +- SubqueryAlias spark_catalog.default.tm
+ +- View (`spark_catalog`.`default`.`tm`, [x#x])
+ +- Project [cast(col1#x as map